From 8629ba0904ba2a58e9d93d774b94586776333fc3 Mon Sep 17 00:00:00 2001
From: "juan.ledesma"
Date: Thu, 6 Jun 2024 11:16:33 +0200
Subject: [PATCH 001/321] updated changelog

---
 CHANGELOG.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 10c775bbe..8c94a1423 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -15,6 +15,7 @@ Code contributions to the new version:
 - [Sarai Varona](https://github.com/svarona)
 - [Daniel Valle](https://github.com/Daniel-VM)
 - [Víctor López](https://github.com/victor5lm)
+- [Juan Ledesma](https://github.com/juanledesma78)
 
 ### Template fixes and updates
 
@@ -43,6 +44,7 @@ Code contributions to the new version:
 - Included annotated tab description in exome-trios markdowns [#273](https://github.com/BU-ISCIII/buisciii-tools/pull/273)
 - Installed all necessary singularity images and modified all templates so that, instead of using conda environments or loaded modules, the corresponding singularity images are used [#272](https://github.com/BU-ISCIII/buisciii-tools/pull/272)
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
+- Change of extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
 
 ### Modules

From f939f321b9430faee16bf469fe5fd970235ad256 Mon Sep 17 00:00:00 2001
From: "juan.ledesma"
Date: Thu, 6 Jun 2024 10:48:07 +0200
Subject: [PATCH 002/321] extension file of all_samples_virus_table_filtered
 changed from csv to tsv to match pikavirus result table

---
 .../templates/viralrecon/RESULTS/lablog_viralrecon_results | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results
index e71f4294f..d229644b9 100755
--- a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results
+++ b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results
@@ -23,7 +23,7 @@ cat references.tmp | while read in; do ln -s ../../ANALYSIS/*/*${in}*/variants/i
 ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html
 ln -s ../../ANALYSIS/*/mapping_illumina*.tab ./mapping_illumina.csv
 ln -s ../../ANALYSIS/*/assembly_stats.csv ./assembly_stats.csv
-ln -s ../../ANALYSIS/*/01-PikaVirus-results/all_samples_virus_table_filtered.csv ./pikavirus_table.csv
+ln -s ../../ANALYSIS/*/01-PikaVirus-results/all_samples_virus_table_filtered.tsv ./pikavirus_table.tsv
 
 #conda activate viralrecon_report
 echo "python ./excel_generator.py -r ./references.tmp --merge_lineage_files" > _01_generate_excel_files.sh

From cc9aa85dc317e8660ded92cc16f2fe14ac8d981c Mon Sep 17 00:00:00 2001
From: "juan.ledesma"
Date: Thu, 6 Jun 2024 12:10:21 +0200
Subject: [PATCH 003/321] updated CHANGELOG

---
 CHANGELOG.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 8c94a1423..d30c41c22 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -44,7 +44,7 @@ Code contributions to the new version:
 - Included annotated tab description in exome-trios markdowns [#273](https://github.com/BU-ISCIII/buisciii-tools/pull/273)
 - Installed all necessary singularity images and modified all templates so that, instead of using conda environments or loaded modules, the corresponding singularity images are used [#272](https://github.com/BU-ISCIII/buisciii-tools/pull/272)
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
-- Change of extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
+- Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
 
 ### Modules

From 9d00f74649173c4897224ed1d368298ebf379b9f Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 12:49:00 +0200
Subject: [PATCH 004/321] Python lint now only runs if .py files in PR

---
 .github/workflows/python_lint.yml | 24 ++++++++++++++++++++++--
 1 file changed, 22 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index d121b7f32..503f3fe1b 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -3,10 +3,10 @@ name: python_lint
 on:
   push:
     paths:
-      - '**/*.py'
+      - '**.py'
   pull_request:
     paths:
-      - '**/*.py'
+      - '**.py'
 
 jobs:
   flake8_py3:
@@ -13,23 +13,43 @@ jobs:
     runs-on: ubuntu-latest
     steps:
      - name: Setup python
        uses: actions/setup-python@v2
        with:
          python-version: 3.9.x
          architecture: x64
      - name: Checkout PyTorch
        uses: actions/checkout@v2
      - name: Install flake8
        run: pip install flake8
+     - name: Check for Python file changes
+       id: file_check
+       run: |
+         git fetch origin ${{ github.base_ref }}
+         diff_pyfiles=$(git diff --name-only origin/${{ github.base_ref }} ${{ github.head_ref }} -- '*.py')
+         echo "::set-output name=diff_pyfiles::$diff_pyfiles"
      - name: Run flake8
+       if: steps.file_check.outputs.diff_pyfiles != ''
        run: flake8 --ignore E501,W503,E203,W605
+     - name: No Python files changed
+       if: steps.file_check.outputs.diff_pyfiles == ''
+       run: echo "No Python files have been changed."
 
   black_lint:
     runs-on: ubuntu-latest
    steps:
      - name: Setup
        uses: actions/checkout@v2
      - name: Install black in jupyter
        run: pip install black[jupyter]
+     - name: Check for Python file changes
+       id: file_check
+       run: |
+         git fetch origin ${{ github.base_ref }}
+         diff_pyfiles=$(git diff --name-only origin/${{ github.base_ref }} ${{ github.head_ref }} -- '*.py')
+         echo "::set-output name=diff_pyfiles::$diff_pyfiles"
      - name: Check code lints with Black
+       if: steps.file_check.outputs.diff_pyfiles != ''
       uses: psf/black@stable
+     - name: No Python files changed
+       if: steps.file_check.outputs.diff_pyfiles == ''
+       run: echo "No Python files have been changed."
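The detection step in PATCH 004 can be dry-run locally before pushing. A minimal sketch, assuming `develop` as the base branch (substitute the PR's real base); note also that GitHub Actions has since deprecated the `::set-output` syntax used above in favour of writing to `$GITHUB_OUTPUT`:

```bash
#!/usr/bin/env bash
# Local dry run of the changed-.py-files check from the workflow above.
git fetch origin develop
diff_pyfiles=$(git diff --name-only origin/develop...HEAD -- '*.py')

if [ -n "$diff_pyfiles" ]; then
    echo "flake8 would run on: $diff_pyfiles"
else
    echo "No Python files have been changed."
fi

# On current runners the deprecated ::set-output call would instead be:
# echo "diff_pyfiles=${diff_pyfiles}" >> "$GITHUB_OUTPUT"
```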
From 9a7b8dd018c738155c9f92ff6618cf3f9d741a6d Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 12:53:38 +0200
Subject: [PATCH 005/321] Updated CHANGELOG

---
 CHANGELOG.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index d30c41c22..baf416343 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -58,6 +58,8 @@ Code contributions to the new version:
 
 #### Changed
 
+- Forcing python lint to success if no .py files are in PR [#279](https://github.com/BU-ISCIII/buisciii-tools/pull/279)
+
 #### Removed
 
 ### Requirements

From 11892bb8accd3c3b866b4e9063fb5dd552230318 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 12:59:13 +0200
Subject: [PATCH 006/321] Removed restriction to pyfiles in lint workflow

---
 .github/workflows/python_lint.yml | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index 503f3fe1b..34ce3efa8 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -2,11 +2,10 @@ name: python_lint
 
 on:
   push:
-    paths:
-      - '**.py'
+    branches: "**"
   pull_request:
-    paths:
-      - '**.py'
+    types: [opened, reopened, synchronize, closed]
+    branches: "**"
 
 jobs:
   flake8_py3:

From 9117bf167fc4f3ce6245e2b287ba3070127318fb Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:10:12 +0200
Subject: [PATCH 007/321] Updated solution to stalled lint

---
 .github/workflows/python_lint.yml | 24 ++++++++++--------------
 1 file changed, 10 insertions(+), 14 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index 34ce3efa8..df75b052a 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -17,38 +17,34 @@ jobs:
          python-version: 3.9.x
          architecture: x64
      - name: Checkout PyTorch
-       uses: actions/checkout@v2
+       uses: actions/checkout@v3
+       fetch-depth: 0
      - name: Install flake8
        run: pip install flake8
      - name: Check for Python file changes
        id: file_check
-       run: |
-         git fetch origin ${{ github.base_ref }}
-         diff_pyfiles=$(git diff --name-only origin/${{ github.base_ref }} ${{ github.head_ref }} -- '*.py')
-         echo "::set-output name=diff_pyfiles::$diff_pyfiles"
+       uses: tj-actions/changed-files@v33
      - name: Run flake8
-       if: steps.file_check.outputs.diff_pyfiles != ''
+       if: steps.file_check.outputs.any_changed == 'true'
        run: flake8 --ignore E501,W503,E203,W605
      - name: No Python files changed
-       if: steps.file_check.outputs.diff_pyfiles == ''
+       if: steps.file_check.outputs.any_changed != 'true'
        run: echo "No Python files have been changed."
 
   black_lint:
     runs-on: ubuntu-latest
    steps:
      - name: Setup
-       uses: actions/checkout@v2
+       uses: actions/checkout@v3
+       fetch-depth: 0
      - name: Install black in jupyter
        run: pip install black[jupyter]
      - name: Check for Python file changes
        id: file_check
-       run: |
-         git fetch origin ${{ github.base_ref }}
-         diff_pyfiles=$(git diff --name-only origin/${{ github.base_ref }} ${{ github.head_ref }} -- '*.py')
-         echo "::set-output name=diff_pyfiles::$diff_pyfiles"
+       uses: tj-actions/changed-files@v34
      - name: Check code lints with Black
-       if: steps.file_check.outputs.diff_pyfiles != ''
+       if: steps.file_check.outputs.any_changed == 'true'
       uses: psf/black@stable
      - name: No Python files changed
-       if: steps.file_check.outputs.diff_pyfiles == ''
+       if: steps.file_check.outputs.any_changed != 'true'
       run: echo "No Python files have been changed."
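The "stalled lint" that the next several commits chase is the classic shallow-clone problem: `actions/checkout` fetches a single commit by default, so any history-based diff has no base to compare against, which is why `fetch-depth: 0` keeps reappearing. A rough local illustration of the failure mode (the clone URL is the real repository; everything else is just a demo):

```bash
#!/usr/bin/env bash
# A depth-1 clone has no parent commits, so history-based diffs fail.
git clone --depth 1 https://github.com/BU-ISCIII/buisciii-tools.git demo && cd demo
git diff --name-only HEAD~1 -- '*.py'   # fatal: ambiguous argument 'HEAD~1': unknown revision

git fetch --unshallow                   # same effect as fetch-depth: 0 in actions/checkout
git diff --name-only HEAD~1 -- '*.py'   # now succeeds
```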
From 617ff6ad4aeb72f4932f54bbbbeba2b78342a4e3 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:11:53 +0200
Subject: [PATCH 008/321] Updated solution to stalled lint. test2

---
 .github/workflows/python_lint.yml | 2 --
 1 file changed, 2 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index df75b052a..64645e0b6 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -18,7 +18,6 @@ jobs:
          architecture: x64
      - name: Checkout PyTorch
        uses: actions/checkout@v3
-       fetch-depth: 0
      - name: Install flake8
        run: pip install flake8
      - name: Check for Python file changes
@@ -36,7 +35,6 @@ jobs:
    steps:
      - name: Setup
        uses: actions/checkout@v3
-       fetch-depth: 0
      - name: Install black in jupyter
        run: pip install black[jupyter]
      - name: Check for Python file changes

From 8e8d1c8a313ded5d761ef15e428ede7f162b99e9 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:14:30 +0200
Subject: [PATCH 009/321] Updated solution to stalled lint. fetch-depth 0

---
 .github/workflows/python_lint.yml | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index 64645e0b6..5aa19c41b 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -17,7 +17,8 @@ jobs:
          python-version: 3.9.x
          architecture: x64
      - name: Checkout PyTorch
-       uses: actions/checkout@v3
+       uses: actions/checkout@v2
+       fetch-depth: 0
      - name: Install flake8
        run: pip install flake8
      - name: Check for Python file changes
@@ -34,7 +35,8 @@ jobs:
    runs-on: ubuntu-latest
    steps:
      - name: Setup
-       uses: actions/checkout@v3
+       uses: actions/checkout@v2
+       fetch-depth: 0
      - name: Install black in jupyter
        run: pip install black[jupyter]
      - name: Check for Python file changes

From 0c7f8a9708e2ed32915805049ac713221582cf34 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:16:26 +0200
Subject: [PATCH 010/321] Updated solution to stalled lint. fixed1

---
 .github/workflows/python_lint.yml | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index 5aa19c41b..eb7625289 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -18,6 +18,7 @@ jobs:
          architecture: x64
      - name: Checkout PyTorch
        uses: actions/checkout@v2
+       with:
        fetch-depth: 0
      - name: Install flake8
        run: pip install flake8
@@ -37,6 +37,7 @@ jobs:
    steps:
      - name: Setup
        uses: actions/checkout@v2
+       with:
        fetch-depth: 0
      - name: Install black in jupyter
        run: pip install black[jupyter]

From 08e1fcaaac44b480a40d069f5ed6cbed7dc4afef Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:19:46 +0200
Subject: [PATCH 011/321] Python linting test

---
 bu_isciii/scratch.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/scratch.py b/bu_isciii/scratch.py
index 5f04ccd93..5a0bbeae2 100755
--- a/bu_isciii/scratch.py
+++ b/bu_isciii/scratch.py
@@ -251,7 +251,7 @@ def remove_scratch(self):
                 stderr.print(
                     "[red]ERROR: Directory "
                     + scratch_folder
-                    + " not the same as "
+                    + " is not the same as "
                     + self.scratch_tmp_path,
                     highlight=False,
                 )

From f5f029d6d6b2cdf792183895ef3edf1b33509870 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:26:54 +0200
Subject: [PATCH 012/321] Updated solution to stalled lint. fixed2

---
 .github/workflows/python_lint.yml | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index eb7625289..aba4945fc 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -25,6 +25,10 @@ jobs:
      - name: Check for Python file changes
        id: file_check
        uses: tj-actions/changed-files@v33
+       with:
+         since_last_remote_commit: true
+         files: |
+           **.py
      - name: Run flake8
        if: steps.file_check.outputs.any_changed == 'true'
        run: flake8 --ignore E501,W503,E203,W605
@@ -44,6 +48,10 @@ jobs:
      - name: Check for Python file changes
        id: file_check
        uses: tj-actions/changed-files@v34
+       with:
+         since_last_remote_commit: true
+         files: |
+           **.py
      - name: Check code lints with Black
        if: steps.file_check.outputs.any_changed == 'true'
       uses: psf/black@stable

From 23b173c6aa0b50de88ee2c7196fbe7f2cde351e2 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:28:24 +0200
Subject: [PATCH 013/321] python linting test2

---
 bu_isciii/scratch.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/scratch.py b/bu_isciii/scratch.py
index 5a0bbeae2..d36dd8655 100755
--- a/bu_isciii/scratch.py
+++ b/bu_isciii/scratch.py
@@ -246,7 +246,7 @@ def remove_scratch(self):
             )
         else:
             log.error(
-                f"Directory path not the same as service resolution. Skip folder copy '{scratch_folder}'"
+                f"Directory path is not the same as service resolution. Skip folder copy '{scratch_folder}'"
             )
             stderr.print(
                 "[red]ERROR: Directory "

From 38c06c06aa65aea3d826ffadc49bdca935cf6bb2 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:42:54 +0200
Subject: [PATCH 014/321] python linting test3

---
 .github/workflows/python_lint.yml | 4 ++--
 bu_isciii/scratch.py              | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index aba4945fc..f3bdcd225 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -26,7 +26,7 @@ jobs:
        id: file_check
        uses: tj-actions/changed-files@v33
        with:
-         since_last_remote_commit: true
+         sha: ${{ github.event.pull_request.head.sha }}
         files: |
           **.py
      - name: Run flake8
@@ -49,7 +49,7 @@ jobs:
        id: file_check
        uses: tj-actions/changed-files@v34
        with:
-         since_last_remote_commit: true
+         sha: ${{ github.event.pull_request.head.sha }}
         files: |
           **.py
      - name: Check code lints with Black
diff --git a/bu_isciii/scratch.py b/bu_isciii/scratch.py
index d36dd8655..d6a420e1b 100755
--- a/bu_isciii/scratch.py
+++ b/bu_isciii/scratch.py
@@ -241,7 +241,7 @@ def remove_scratch(self):
             if self.service_folder in scratch_folder:
                 shutil.rmtree(scratch_folder)
                 stderr.print(
-                    "[green]Successfully removed the directory %s" % scratch_folder,
+                    "[green]Successfully removed directory %s" % scratch_folder,
                     highlight=False,
                 )
             else:

From b74549495a4215f45cbbc096698cadc1a3f37880 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:51:42 +0200
Subject: [PATCH 015/321] Updated diff-file checker version

---
 .github/workflows/python_lint.yml | 7 +++----
 bu_isciii/scratch.py              | 2 +-
 2 files changed, 4 insertions(+), 5 deletions(-)

diff --git a/.github/workflows/python_lint.yml b/.github/workflows/python_lint.yml
index f3bdcd225..b373db7a6 100644
--- a/.github/workflows/python_lint.yml
+++ b/.github/workflows/python_lint.yml
@@ -24,7 +24,7 @@ jobs:
      - name: Check for Python file changes
        id: file_check
-       uses: tj-actions/changed-files@v33
+       uses: tj-actions/changed-files@v44
       with:
         sha: ${{ github.event.pull_request.head.sha }}
         files: |
           **.py
      - name: Run flake8
@@ -47,10 +47,9 @@ jobs:
      - name: Check for Python file changes
        id: file_check
-       uses: tj-actions/changed-files@v34
+       uses: tj-actions/changed-files@v44
        with:
          sha: ${{ github.event.pull_request.head.sha }}
-         files: |
-           **.py
+         files: '**.py'
      - name: Check code lints with Black
        if: steps.file_check.outputs.any_changed == 'true'
       uses: psf/black@stable
diff --git a/bu_isciii/scratch.py b/bu_isciii/scratch.py
index d6a420e1b..9f2a9984f 100755
--- a/bu_isciii/scratch.py
+++ b/bu_isciii/scratch.py
@@ -201,7 +201,7 @@ def revert_copy_scratch(self):
         except Exception as e:
             stderr.print(e)
             stderr.print(
-                "[red]ERROR: Copy of the directory %s failed"
+                "[red]ERROR: Copy of directory %s failed"
                 % self.scratch_tmp_path,
                 highlight=False,
             )

From b632b0225b5efbe095b4c2f19540e7d023519226 Mon Sep 17 00:00:00 2001
From: Shettland
Date: Thu, 6 Jun 2024 13:54:37 +0200
Subject: [PATCH 016/321] Test commit without py files

---
 README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/README.md b/README.md
index 9d597a7cc..122bb0708 100644
--- a/README.md
+++ b/README.md
@@ -72,7 +72,7 @@ Options:
   -u, --api_user TEXT      User for the API logging
   -p, --api_password TEXT  Password for the API logging
   -c, --cred_file TEXT     Config file with API logging credentials
-  --help                   Show this message and exit.
+  --help                   Show this message and exit
 
 Commands:
   list        List available bu-isciii services.

From 342067a95c9e334c08e9e9dc0a4bf0dc91db77cd Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sara=20Monz=C3=B3n?=
Date: Tue, 4 Jun 2024 16:33:13 +0200
Subject: [PATCH 017/321] added versions dep to environment.yml file

---
 environment.yml | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/environment.yml b/environment.yml
index f21d9fe78..cdad4196c 100644
--- a/environment.yml
+++ b/environment.yml
@@ -1,5 +1,7 @@
 channels:
 - conda-forge
 dependencies:
-- wkhtmltopdf
-- tree
+- wkhtmltopdf>=0.12.4
+- tree>=2.0.2
+- pip>22.0.2
+- python>3.9

From 2c1be53f9975ecfb9eb82b85a347581ab592a38d Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sara=20Monz=C3=B3n?=
Date: Tue, 4 Jun 2024 16:33:59 +0200
Subject: [PATCH 018/321] removed path for loading wkhtmlpdf, and caught error
 when executable does not exist

---
 bu_isciii/bioinfo_doc.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py
index b4d0ab4ea..e863fce4e 100755
--- a/bu_isciii/bioinfo_doc.py
+++ b/bu_isciii/bioinfo_doc.py
@@ -185,8 +185,13 @@ def __init__(
         )
         self.samples = self.resolution_info.get("samples", None)
         self.handled_services = None
-        path_to_wkhtmltopdf = os.path.normpath(self.conf["wkhtmltopdf_path"])
-        self.config_pdfkit = pdfkit.configuration(wkhtmltopdf=path_to_wkhtmltopdf)
+        try:
+            self.config_pdfkit = pdfkit.configuration()
+        except OSError as e:
+            stderr.print("[red] wkhtmlpdf executable was not found. Install it using conda environment.")
+            stderr.print(f"[red] Error: {e}")
+            sys.exit()
+
         if self.type == "service_info":
             self.template_file = self.conf["service_info_template_path_file"]
         else:
@@ -416,6 +421,7 @@ def convert_to_pdf(self, html_file):
             )
         except OSError as e:
             stderr.print("[red] Unable to convert to PDF")
+            stderr.print(f"[red] Error: {e}")
             log.exception("Unable to create pdf.", exc_info=e)
         return

From 3be8b0b0d96fe1f2f1be97fd288f299f7fcf55e5 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sara=20Monz=C3=B3n?=
Date: Tue, 4 Jun 2024 16:34:34 +0200
Subject: [PATCH 019/321] removed wkhtmlpdf path from configs

---
 bu_isciii/conf/configuration.json     | 1 -
 bu_isciii/conf/configuration_dev.json | 1 -
 2 files changed, 2 deletions(-)

diff --git a/bu_isciii/conf/configuration.json b/bu_isciii/conf/configuration.json
index d133d3a50..d4e4f86ea 100755
--- a/bu_isciii/conf/configuration.json
+++ b/bu_isciii/conf/configuration.json
@@ -36,7 +36,6 @@
     "delivery_template_path_file": "templates/jinja_template_delivery.j2",
     "html_template_path_file": "templates/html_service_template.html",
     "path_to_css": "assets/css",
-    "wkhtmltopdf_path": "/data/bi/pipelines/miniconda3/envs/buisciii-tools/bin/wkhtmltopdf",
     "email_host": "mx2.isciii.es",
     "email_port": "587",
     "email_host_user": "bioinformatica@isciii.es",
diff --git a/bu_isciii/conf/configuration_dev.json b/bu_isciii/conf/configuration_dev.json
index 08d1fd262..68e948cb5 100755
--- a/bu_isciii/conf/configuration_dev.json
+++ b/bu_isciii/conf/configuration_dev.json
@@ -36,7 +36,6 @@
     "delivery_template_path_file": "templates/jinja_template_delivery.j2",
     "html_template_path_file": "templates/html_service_template.html",
     "path_to_css": "assets/css",
-    "wkhtmltopdf_path": "/data/bi/pipelines/miniconda3/envs/buisciii-tools/bin/wkhtmltopdf",
     "email_host": "mx2.isciii.es",
     "email_port": "587",
     "email_host_user": "bioinformatica@isciii.es",

From 662c30aead3b176eaf93792f744a253d1472cfe4 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sara=20Monz=C3=B3n?=
Date: Tue, 4 Jun 2024 16:40:15 +0200
Subject: [PATCH 020/321] clarified readme install instructions

---
 README.md | 31 +++++++++++++++++++++----------
 1 file changed, 21 insertions(+), 10 deletions(-)

diff --git a/README.md b/README.md
index 122bb0708..138380a1a 100644
--- a/README.md
+++ b/README.md
@@ -7,9 +7,8 @@
 - [buisciii-tools](#buisciii-tools)
   - [Installation](#installation)
-    - [Bioconda](#bioconda)
-    - [Pip](#pip)
-    - [Development version](#development-version)
+    - [Micromamba and pip](#micromamba-and-pip)
+    - [Dev version](#dev-version)
   - [Usage](#usage)
     - [Command-line](#command-line)
       - [list](#list)
@@ -26,28 +25,39 @@
 
 ## Installation
 
-### Bioconda
+### Micromamba and pip
 
 ```bash
-conda create -n buisciii-tools pip
-conda activate
-conda env update --file environment.yml
+micromamba create -n buisciii -f environment.yml
+micromamba activate buisciii
+pip install --force-reinstall --upgrade git+https://github.com/bu-isciii/buisciii-tools.git@main
 ```
 
-### Pip
+or
 
 ```bash
+git checkout main
+conda create -n buisciii -f environment.yml
 conda activate
 pip install .
 ```
 
-### Development version
+### Dev version
 
 If you want to install the latest code in the repository:
 
 ```bash
-conda create -n buisciii_dev pip
+micromamba create -n buisciii_dev -f environment.yml
+micromamba activate buisciii_dev
 pip install --force-reinstall --upgrade git+https://github.com/bu-isciii/buisciii-tools.git@develop
 ```
 
+or locally:
+
+```bash
+git checkout develop
+micromamba create -n buisciii_dev -f environment.yml
+micromamba activate buisciii_dev
+pip install .
+```
+
 ## Usage
 
 ### Command-line

From dac62fa0bed78ce21c87f25090314b172641a32f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sara=20Monz=C3=B3n?=
Date: Tue, 4 Jun 2024 16:45:05 +0200
Subject: [PATCH 021/321] updated changelog

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index baf416343..95f6bbda5 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -51,6 +51,7 @@ Code contributions to the new version:
 #### Added enhancements
 
 - PR [#274](https://github.com/BU-ISCIII/buisciii-tools/pull/274): added `--dev` option, configuration dev and test folder structure.
+- PR [#276](https://github.com/BU-ISCIII/buisciii-tools/pull/276): wkhtmlpdf does not need absolute path to executable. Added better error handling when executable does not exist.
 
 #### Fixes

From ba47621fc5aa1774b831655e26f3984a1e7f0fd2 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Sara=20Monz=C3=B3n?=
Date: Tue, 4 Jun 2024 16:45:31 +0200
Subject: [PATCH 022/321] linting

---
 bu_isciii/bioinfo_doc.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py
index e863fce4e..b598f344b 100755
--- a/bu_isciii/bioinfo_doc.py
+++ b/bu_isciii/bioinfo_doc.py
@@ -188,7 +188,9 @@ def __init__(
         try:
             self.config_pdfkit = pdfkit.configuration()
         except OSError as e:
-            stderr.print("[red] wkhtmlpdf executable was not found. Install it using conda environment.")
+            stderr.print(
+                "[red] wkhtmlpdf executable was not found. Install it using conda environment."
+            )
             stderr.print(f"[red] Error: {e}")
             sys.exit()

From f67600e8f0806409074b3b49376ef3638d7ae940 Mon Sep 17 00:00:00 2001
From: jaimeozaez <135366362+jaimeozaez@users.noreply.github.com>
Date: Fri, 7 Jun 2024 11:50:34 +0200
Subject: [PATCH 023/321] Fixed clean module (#280)

* services.json modified in order to properly delete trimmed fastq files in assembly annotation
* self.service_samples modified in order to properly get list of service samples
* assembly files to delete modified in services.json
* services.json updated with mtbseq service info
* Modified purge_files function for avoiding repeated files in files_to_delete list
* Modified purge_files function for avoiding repeated files in files_to_delete list
* Relocated self.rename() method usage for _DEL renaming of purged folders. Now it is called when self.option = rename_nocopy
* delete_rename() function renamed to just delete()
* self.option rename_nocopy renamed to rename
* Reverted last commits
* Reverted some weird changes...
* Relocated self.rename() method usage for _DEL renaming of purged folders
* Renamed self.delete_rename() method. Now it is self.delete()
* rename_nocopy option modified to just rename
* files to delete added to services.json for rnaseq service
* Updated CHANGELOG
* fixed linting
* Fixed linting
---
 CHANGELOG.md                      |  1 +
 bu_isciii/__main__.py             |  6 +++---
 bu_isciii/clean.py                | 30 ++++++++++++++++--------------
 bu_isciii/templates/services.json | 14 +++++++-------
 4 files changed, 27 insertions(+), 24 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 95f6bbda5..03484899d 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -56,6 +56,7 @@ Code contributions to the new version:
 #### Fixes
 
 - Fixed archive module. Updated correct header for scout tsv [#258](https://github.com/BU-ISCIII/buisciii-tools/pull/258).
+- Fixed clean module. Corrected purge_files function. Renaming stage moved from clean to rename_nocopy option. Updated services.json file with correct paths for some services. [#280](https://github.com/BU-ISCIII/buisciii-tools/pull/280)
 
 #### Changed

diff --git a/bu_isciii/__main__.py b/bu_isciii/__main__.py
index 3c3747612..012b3bb4a 100755
--- a/bu_isciii/__main__.py
+++ b/bu_isciii/__main__.py
@@ -307,7 +307,7 @@ def scratch(ctx, resolution, path, tmp_dir, direction, ask_path):
     type=click.Choice(
         [
             "full_clean",
-            "rename_nocopy",
+            "rename",
             "clean",
             "revert_renaming",
             "show_removable",
@@ -317,7 +317,7 @@ def scratch(ctx, resolution, path, tmp_dir, direction, ask_path):
     multiple=False,
     help=(
         "Select what to do inside the cleanning step: full_clean: delete files and folders to clean,"
-        " rename no copy and deleted folders, rename_nocopy: just rename no copy folders, clean: "
+        " rename no copy and deleted folders, rename: just rename folders, clean: "
        "delete files and folders to clean,"
@@ -447,7 +447,7 @@ def finish(ctx, resolution, path, ask_path, sftp_folder, tmp_dir):
         resolution,
         path,
         ask_path,
-        "rename_nocopy",
+        "rename",
         ctx.obj["api_user"],
         ctx.obj["api_password"],
         ctx.obj["conf"],

diff --git a/bu_isciii/clean.py b/bu_isciii/clean.py
index aeabff8db..3dba081c0 100644
--- a/bu_isciii/clean.py
+++ b/bu_isciii/clean.py
@@ -55,7 +55,9 @@ def __init__(
         self.services_requested = self.resolution_info["resolutions"][0][
             "available_services"
         ]
-        self.service_samples = self.resolution_info["samples"]
+        self.service_samples = [
+            sample_id["sample_name"] for sample_id in self.resolution_info["samples"]
+        ]
 
         if ask_path and path is None:
             stderr.print(
@@ -94,14 +96,13 @@ def __init__(
         self.delete_files = self.get_clean_items(self.services_to_clean, type="files")
         # self.delete_list = [item for item in self.delete_list if item]
         self.nocopy = self.get_clean_items(self.services_to_clean, type="no_copy")
-        self.service_samples = self.resolution_info.get("Samples", None)
 
         if option is None:
             self.option = bu_isciii.utils.prompt_selection(
                 "Options",
                 [
                     "full_clean",
-                    "rename_nocopy",
+                    "rename",
                     "clean",
                     "revert_renaming",
                     "show_removable",
@@ -312,10 +313,9 @@ def purge_files(self):
         files_to_delete = []
         for sample_info in self.service_samples:
             for file in self.delete_files:
-                file_to_delete = file.replace(
-                    "sample_name", sample_info["sample_name"]
-                )
-                files_to_delete.append(file_to_delete)
+                file_to_delete = file.replace("sample_name", sample_info)
+                if file_to_delete not in files_to_delete:
+                    files_to_delete.append(file_to_delete)
         path_content = self.scan_dirs(to_find=files_to_delete)
         for file in path_content:
             os.remove(file)
@@ -371,7 +371,7 @@ def delete_work(self):
         else:
             stderr.print("There is no work folder here")
 
-    def delete_rename(self, verbose=True, sacredtexts=["lablog", "logs"], add="_DEL"):
+    def delete(self, verbose=True, sacredtexts=["lablog", "logs"], add="_DEL"):
         """
         Description:
             Remove both files and purge folders defined for the service, and rename to tag.
@@ -392,10 +392,8 @@ def delete(self, verbose=True, sacredtexts=["lablog", "logs"], add="_DEL"):
         # Purge folders
         if self.delete_folders != "":
             self.purge_folders(sacredtexts=sacredtexts, add=add, verbose=verbose)
-            # Rename to tag.
-            self.rename(add=add, to_find=self.delete_folders, verbose=verbose)
         else:
-            stderr.print("No folders to remove or rename")
+            stderr.print("No folders to remove")
         # Purge work
         self.delete_work()
         # Delete files
@@ -432,8 +430,10 @@ def full_clean(self):
             Perform and handle the whole cleaning of the service
         """
-        self.delete_rename()
+        self.delete()
         self.rename(to_find=self.nocopy, add="_NC", verbose=True)
+        if self.delete_folders != "":
+            self.rename(add="_DEL", to_find=self.delete_folders, verbose=True)
 
     def handle_clean(self):
         """
@@ -445,9 +445,11 @@ def handle_clean(self):
             self.show_nocopy()
         if self.option == "full_clean":
             self.full_clean()
-        if self.option == "rename_nocopy":
+        if self.option == "rename":
             self.rename(to_find=self.nocopy, add="_NC", verbose=True)
+            if self.delete_folders != "":
+                self.rename(add="_DEL", to_find=self.delete_folders, verbose=True)
         if self.option == "clean":
-            self.delete_rename()
+            self.delete()
         if self.option == "revert_renaming":
             self.revert_renaming()

diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json
index 0e8e853b8..bb88dfafb 100755
--- a/bu_isciii/templates/services.json
+++ b/bu_isciii/templates/services.json
@@ -8,8 +8,8 @@
         "end": "",
         "description": "nf-core/bacass: Simple bacterial assembly and annotation pipeline",
         "clean": {
-            "folders":["01-preprocessing/trimmed_sequences"],
-            "files":[]
+            "folders":[],
+            "files":["01-processing/fastp/sample_name_1.fastp.fastq.gz", "01-processing/fastp/sample_name_2.fastp.fastq.gz"]
         },
         "no_copy": ["RAW", "TMP", "latest"],
         "last_folder":"REFERENCES",
@@ -25,8 +25,8 @@
         "url": "https://github.com/ngs-fzb/MTBseq_source",
         "description": "Mycobacterium tuberculosis mapping, variant calling and detection of resistance using MTBseq",
         "clean": {
-            "folders":["01-preprocessing/trimmed_sequences", "Bam", "Mpileup"],
-            "files":[]
+            "folders":["Bam", "Mpileup"],
+            "files":["01-processing/fastp/sample_name_1.fastp.fastq.gz", "01-processing/fastp/sample_name_2.fastp.fastq.gz"]
         },
         "no_copy": ["RAW", "TMP"],
         "last_folder":"REFERENCES",
@@ -42,8 +42,8 @@
         "url": "https://github.com/ngs-fzb/MTBseq_source",
         "description": "Mycobacterium tuberculosis mapping, variant calling and detection of resistance using MTBseq",
         "clean": {
-            "folders":["01-preprocessing", "Bam", "Mpileup"],
-            "files":[]
+            "folders":["Bam", "Mpileup"],
+            "files":["01-processing/fastp/sample_name_1.fastp.fastq.gz", "01-processing/fastp/sample_name_2.fastp.fastq.gz"]
         },
         "no_copy": ["RAW", "TMP"],
         "last_folder":"REFERENCES",
@@ -146,7 +146,7 @@
         "description": "RNA-seq analysis",
         "clean": {
             "folders":[],
-            "files":[]
+            "files":["star_salmon/sample_name.Aligned.out.bam", "star_salmon/sample_name.Aligned.toTranscriptome.out.bam"]
         },
         "no_copy": ["RAW", "TMP"],
         "last_folder":"RESULTS",

From 5af33bb192d8f432c610cce778557a6524c60a35 Mon Sep 17 00:00:00 2001
From: jaimeozaez <135366362+jaimeozaez@users.noreply.github.com>
Date: Mon, 10 Jun 2024 20:56:45 +0200
Subject: [PATCH 024/321] Fixed autoclean-sftp function (#281)

* Added @click.pass_context before autoclean_sftp function
* Updated CHANGELOG.md
* removed tatus file
---
 CHANGELOG.md          | 1 +
 bu_isciii/__main__.py | 1 +
 2 files changed, 2 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 03484899d..ecfd10de8 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -57,6 +57,7 @@ Code contributions to the new version:
 - Fixed archive module. Updated correct header for scout tsv [#258](https://github.com/BU-ISCIII/buisciii-tools/pull/258).
 - Fixed clean module. Corrected purge_files function. Renaming stage moved from clean to rename_nocopy option. Updated services.json file with correct paths for some services. [#280](https://github.com/BU-ISCIII/buisciii-tools/pull/280)
+- Fixed autoclean-sftp function. [#281](https://github.com/BU-ISCIII/buisciii-tools/pull/281)
 
 #### Changed

diff --git a/bu_isciii/__main__.py b/bu_isciii/__main__.py
index 012b3bb4a..321bb172c 100755
--- a/bu_isciii/__main__.py
+++ b/bu_isciii/__main__.py
@@ -640,6 +640,7 @@ def archive(
     default=14,
     help="Integer, remove files older than a window of `-d [int]` days. Default 14 days.",
 )
+@click.pass_context
 def autoclean_sftp(ctx, sftp_folder, days):
     """Clean old sftp services"""
     sftp_clean = bu_isciii.autoclean_sftp.AutoremoveSftpService(

From ff90493b8a20c9848280d43553646f83e5253864 Mon Sep 17 00:00:00 2001
From: jaimeozaez <135366362+jaimeozaez@users.noreply.github.com>
Date: Wed, 12 Jun 2024 16:49:25 +0200
Subject: [PATCH 025/321] Fixed singularity-images path when updating pangolin
 database in lablog_viralrecon. (#282)

* Updated CHANGELOG.md
* removed tatus file
* Corrected singularity-images path when updating pangolin database
* Updated Changelog
* Added line break after prompted input
* Updated CHANGELOG
---
 CHANGELOG.md                                  |  3 ++-
 .../viralrecon/ANALYSIS/lablog_viralrecon    | 16 ++++++++--------
 2 files changed, 10 insertions(+), 9 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index ecfd10de8..77b146ea7 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -44,7 +44,8 @@ Code contributions to the new version:
 - Installed all necessary singularity images and modified all templates so that, instead of using conda environments or loaded modules, the corresponding singularity images are used [#272](https://github.com/BU-ISCIII/buisciii-tools/pull/272)
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
-- Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
+- Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
+- Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
 
 ### Modules

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 58fa21704..916f3d7fb 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -65,10 +65,10 @@ update_pangolin() {
         echo -e "Pangolin database is UP TO DATE. \xE2\x9C\x85"
     else
         mkdir "$(date '+%Y%m%d')"
-        srun --partition short_idx singularity run -B ${PWD} /scratch/bi/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/
+        srun --partition short_idx singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/
         # log file creation
         echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tmkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/log
-        echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tsrun --partition short_idx singularity run -B ${PWD} /scratch/bi/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/log
+        echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tsrun --partition short_idx singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/log
         echo_green "Pangolin database UPDATED."
     fi
     cd -
@@ -211,7 +211,7 @@ echo_bold "\nPlease specify the type of analysis."
 echo_bold "1. METAGENOMICS"
 echo_bold "2. AMPLICONS"
 while true; do
-    echo -ne "\e[1;38;5;220m"; read -n 1 ANALYSIS_TYPE; tput sgr0
+    echo -ne "\e[1;38;5;220m"; read -n 1 ANALYSIS_TYPE; tput sgr0; echo
     if [ "$ANALYSIS_TYPE" == "1" ]; then
         ANALYSIS_TYPE="METAGENOMIC"
         echo_green "$ANALYSIS_TYPE analysis selected."
@@ -230,7 +230,7 @@ echo_bold "\nPlease specify the method to be performed."
 echo_bold "2. De novo assemby"
 echo_bold "3. Both"
 while true; do
-    echo -ne "\e[1;38;5;220m"; read -n 1 method; tput sgr0
+    echo -ne "\e[1;38;5;220m"; read -n 1 method; tput sgr0; echo
     if [ "$method" == "1" ]; then
         echo_green "Mapping method selected."
         break
@@ -251,7 +251,7 @@ echo_bold "\nPlease specify the method to be performed."
 # Setting samples_ref.txt file
 echo
-read -p $'\e[1;37mIs samples_ref.txt file already prepared? [y/N]: \e[1;38;5;220m' -n 1 samples_ref_prepared; tput sgr0
+read -p $'\e[1;37mIs samples_ref.txt file already prepared? [y/N]: \e[1;38;5;220m' -n 1 samples_ref_prepared; tput sgr0; echo
 if [ "$samples_ref_prepared" == "y" ]; then
     echo -e "File samples_ref.txt READY. \xE2\x9C\x85"
 else
@@ -260,7 +260,7 @@ else
     while [ -z "$host" ] || [ -z "$reference" ] || [ "$answer" = "n" ]; do
         read -p $'\e[1;37mPlease specify the host: \e[1;38;5;220m' host
         read -p $'\e[1;37mPlease specify the reference: \e[1;38;5;220m' reference
-        read -p $'\e[1;37mAre host [\e[1;38;5;220m'"${host^^}"$'\e[1;37m] and reference [\e[1;38;5;220m'"${reference}"$'\e[1;37m] correct? [Y/n]: \e[1;38;5;220m' -n 1 answer; tput sgr0
+        read -p $'\e[1;37mAre host [\e[1;38;5;220m'"${host^^}"$'\e[1;37m] and reference [\e[1;38;5;220m'"${reference}"$'\e[1;37m] correct? [Y/n]: \e[1;38;5;220m' -n 1 answer; tput sgr0; echo
     done
     while read in; do echo -e "${in}\t${reference}\t${host^^}" >> samples_ref.txt; done < samples_id.txt
     echo -e "File samples_ref.txt READY. \xE2\x9C\x85"
@@ -272,7 +272,7 @@ if [ "$ANALYSIS_TYPE" = "METAGENOMIC" ]; then
 
     # Nextclade is able to analyze monkeypox virus
     echo
-    read -p $'\e[1;37mDo the sequences correspond to monkeypox virus (MPV)? [y/N]: \e[1;38;5;220m' -n 1 monkeypox; tput sgr0
+    read -p $'\e[1;37mDo the sequences correspond to monkeypox virus (MPV)? [y/N]: \e[1;38;5;220m' -n 1 monkeypox; tput sgr0; echo
 
     if [ "$monkeypox" == "y" ]; then
         virus_tag='mpox'
@@ -291,7 +291,7 @@ else
     echo_bold "2. RSV"
     echo_bold "3. Other"
     while true; do
-        echo -ne "\e[1;38;5;220m"; read -n 1 virus_tag; tput sgr0
+        echo -ne "\e[1;38;5;220m"; read -n 1 virus_tag; tput sgr0; echo
         if [ "$virus_tag" == "1" ]; then
             virus_tag="sars-cov-2"
             echo_green "${virus_tag^^} virus selected."

From 9e9ce3af63b5c0f9184540a0ef9ce651a8498694 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Mon, 10 Jun 2024 16:13:26 +0200
Subject: [PATCH 026/321] Updated CHANGELOG.md

---
 tatus | 2 ++
 1 file changed, 2 insertions(+)
 create mode 100644 tatus

diff --git a/tatus b/tatus
new file mode 100644
index 000000000..6f1a1d8db
--- /dev/null
+++ b/tatus
@@ -0,0 +1,2 @@
+* develop
+  main

From 7771433ce8489976b80c0d8e20ba794f368620f7 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Mon, 10 Jun 2024 16:25:51 +0200
Subject: [PATCH 027/321] removed tatus file

---
 tatus | 2 --
 1 file changed, 2 deletions(-)
 delete mode 100644 tatus

diff --git a/tatus b/tatus
deleted file mode 100644
index 6f1a1d8db..000000000
--- a/tatus
+++ /dev/null
@@ -1,2 +0,0 @@
-* develop
-  main

From 9173ce5788a31a888cbc13e8e9b1b46bfc65f5fc Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 15:42:02 +0200
Subject: [PATCH 028/321] Fixed conflict

---
 CHANGELOG.md | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 77b146ea7..084e38884 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -45,7 +45,11 @@ Code contributions to the new version:
 - Installed all necessary singularity images and modified all templates so that, instead of using conda environments or loaded modules, the corresponding singularity images are used [#272](https://github.com/BU-ISCIII/buisciii-tools/pull/272)
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
 - Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
+<<<<<<< HEAD
 - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
+=======
+- Fixed singularity-images path when updating pangolin database in lablog_viralrecon. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
+>>>>>>> c4bd14e (Updated Changelog)
 
 ### Modules

From dfaf61719b3c9cbd2ae863f59085765b69f7276c Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 15:42:43 +0200
Subject: [PATCH 029/321] Fixed conflict

---
 CHANGELOG.md | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 084e38884..cb1647768 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -46,10 +46,14 @@ Code contributions to the new version:
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
 - Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
 <<<<<<< HEAD
+<<<<<<< HEAD
 - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
 =======
 - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
 >>>>>>> c4bd14e (Updated Changelog)
+=======
+- Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
+>>>>>>> a7da8ac (Updated CHANGELOG)
 
 ### Modules

From fb05f50ce1e4c590289931cada29a62705320e9a Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 15:44:46 +0200
Subject: [PATCH 030/321] Fixed conflict

---
 CHANGELOG.md | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index cb1647768..41f02fae5 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -46,14 +46,8 @@ Code contributions to the new version:
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
 - Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
-<<<<<<< HEAD
-<<<<<<< HEAD
 - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
-=======
-- Fixed singularity-images path when updating pangolin database in lablog_viralrecon. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
->>>>>>> c4bd14e (Updated Changelog)
-=======
+- Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
->>>>>>> a7da8ac (Updated CHANGELOG)
 
 ### Modules

From d02b8fc41c9ae9f942d3e51f84c997a71514ff82 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 15:56:14 +0200
Subject: [PATCH 031/321] Modified 02-preprocessing/lablog in snippy template
 in order to properly find trimmed reads from bacass pipeline

---
 .../ANALYSIS01_SNIPPY/02-preprocessing/lablog | 25 +++++++++++++++----
 1 file changed, 20 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/02-preprocessing/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/02-preprocessing/lablog
index 70183be4e..23216d1af 100644
--- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/02-preprocessing/lablog
+++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/02-preprocessing/lablog
@@ -1,11 +1,26 @@
 # module load singularity
 
 # if assembly pipeline was performed first and the trimmed sequences were saved, this should work:
-# cat ../samples_id | xargs -I mkdir @@; cd $_; ln -s ../../*/01-preprocessing/trimmed_sequences/@@*.gz @@; cd -
-# else:
+read -p $'\e[1;37mDid you save the trimmed reads from previous assembly pipeline? [y/N]: \e[1;38;5;220m' -n 1 answer; tput sgr0; echo
+  if [ "$answer" == "y" ]; then
+    echo "Creating links to trimmed reads..."
 
-mkdir logs
+    while read in; do
+      mkdir ${in}
+      cd ${in}
+      ln -s ../../../*/01-processing/fastp/${in}_1.fastp.fastq.gz ${in}_R1_filtered.fastq.gz
+      ln -s ../../../*/01-processing/fastp/${in}_2.fastp.fastq.gz ${in}_R2_filtered.fastq.gz
+      cd -
+    done < ../samples_id.txt
 
-scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')
+    echo -e "\e[32mLinks for $(cat ../samples_id.txt | wc -l) samples successfully created.\e[0m"
 
-cat ../samples_id.txt | xargs -I @@ echo "mkdir @@; srun --chdir ${scratch_dir} --mem 10G --time 1:00:00 --job-name FP.@@ --output logs/FP.@@.%j.log --partition short_idx --cpus-per-task 5 singularity exec -B ${scratch_dir}/../../../ -B /srv/fastq_repo/ /data/bi/pipelines/singularity-images/fastp:0.20.0--hdbcaa40_0 fastp --in1 ${scratch_dir}/../00-reads/@@_R1.fastq.gz --in2 ${scratch_dir}/../00-reads/@@_R2.fastq.gz --thread 5 --cut_front --cut_tail --cut_mean_quality 15 --qualified_quality_phred 15 --trim_poly_x --detect_adapter_for_pe --json ${scratch_dir}/@@/@@_fastp.json --html ${scratch_dir}/@@/@@_fastp.html --out1 ${scratch_dir}/@@/@@_R1_filtered.fastq.gz --out2 ${scratch_dir}/@@/@@_R2_filtered.fastq.gz &" > _01_fastp.sh
+  else
+
+    mkdir logs
+
+    scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')
+
+    cat ../samples_id.txt | xargs -I @@ echo "mkdir @@; srun --chdir ${scratch_dir} --mem 10G --time 1:00:00 --job-name FP.@@ --output logs/FP.@@.%j.log --partition short_idx --cpus-per-task 5 singularity exec -B ${scratch_dir}/../../../ -B /srv/fastq_repo/ /data/bi/pipelines/singularity-images/fastp:0.20.0--hdbcaa40_0 fastp --in1 ${scratch_dir}/../00-reads/@@_R1.fastq.gz --in2 ${scratch_dir}/../00-reads/@@_R2.fastq.gz --thread 5 --cut_front --cut_tail --cut_mean_quality 15 --qualified_quality_phred 15 --trim_poly_x --detect_adapter_for_pe --json ${scratch_dir}/@@/@@_fastp.json --html ${scratch_dir}/@@/@@_fastp.html --out1 ${scratch_dir}/@@/@@_R1_filtered.fastq.gz --out2 ${scratch_dir}/@@/@@_R2_filtered.fastq.gz &" > _01_fastp.sh
+
+    echo -e "\e[32mFile _01_fastp.sh ready.\e[0m"
+
+  fi
\ No newline at end of file

From 11e4f0e9de4900c1dc23d440b14d25d2b709662f Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 16:01:44 +0200
Subject: [PATCH 032/321] Modified 01-preprocessing/lablog in characterization
 template in order to properly find trimmed reads from bacass pipeline

---
 .../ANALYSIS01_CHARACTERIZATION/01-preprocessing/lablog | 32 +++++++++++++++----
 1 file changed, 26 insertions(+), 6 deletions(-)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/01-preprocessing/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/01-preprocessing/lablog
index b7532e2bf..d1d3eb738 100644
--- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/01-preprocessing/lablog
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/01-preprocessing/lablog
@@ -1,7 +1,27 @@
-# module load singularity
+# module load singularity
+
 # if assembly pipeline was performed first and the trimmed sequences were saved, this should work:
-# cat ../samples_id.txt | xargs -I @@ mkdir @@; cd @@; ln -s ../../../*/01-processing/fastp/@@_1.fastp.fastq.gz ./@@_R1_filtered.fastq.gz; ln -s ../../../*/01-processing/fastp/@@_2.fastp.fastq.gz ./@@_R2_filtered.fastq.gz ; cd -
-# else:
-mkdir logs
-scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')
-cat ../samples_id.txt | xargs -I @@ echo "mkdir @@; srun --chdir ${scratch_dir} --mem 10G --time 1:00:00 --job-name FP.@@ --output logs/FP.@@.%j.log --partition short_idx --cpus-per-task 5 singularity exec -B ${scratch_dir}/../../../ -B /srv/fastq_repo/ /data/bi/pipelines/singularity-images/fastp:0.20.0--hdbcaa40_0 fastp --in1 ${scratch_dir}/../00-reads/@@_R1.fastq.gz --in2 ${scratch_dir}/../00-reads/@@_R2.fastq.gz --thread 5 --cut_front --cut_tail --cut_mean_quality 15 --qualified_quality_phred 15 --trim_poly_x --detect_adapter_for_pe --json ${scratch_dir}/@@/@@_fastp.json --html ${scratch_dir}/@@/@@_fastp.html --out1 ${scratch_dir}/@@/@@_R1_filtered.fastq.gz --out2 ${scratch_dir}/@@/@@_R2_filtered.fastq.gz &" > _01_fastp.sh
+read -p $'\e[1;37mDid you save the trimmed reads from previous assembly pipeline? [y/N]: \e[1;38;5;220m' -n 1 answer; tput sgr0; echo
+  if [ "$answer" == "y" ]; then
+    echo "Creating links to trimmed reads..."
+
+    while read in; do
+      mkdir ${in}
+      cd ${in}
+      ln -s ../../../*/01-processing/fastp/${in}_1.fastp.fastq.gz ${in}_R1_filtered.fastq.gz
+      ln -s ../../../*/01-processing/fastp/${in}_2.fastp.fastq.gz ${in}_R2_filtered.fastq.gz
+      cd -
+    done < ../samples_id.txt
+
+    echo -e "\e[32mLinks for $(cat ../samples_id.txt | wc -l) samples successfully created.\e[0m"
+
+  else
+    echo "Preparing _01_fastp.sh file for trimming..."
+
+    mkdir logs
+    scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')
+    cat ../samples_id.txt | xargs -I @@ echo "mkdir @@; srun --chdir ${scratch_dir} --mem 10G --time 1:00:00 --job-name FP.@@ --output logs/FP.@@.%j.log --partition short_idx --cpus-per-task 5 singularity exec -B ${scratch_dir}/../../../ -B /srv/fastq_repo/ /data/bi/pipelines/singularity-images/fastp:0.20.0--hdbcaa40_0 fastp --in1 ${scratch_dir}/../00-reads/@@_R1.fastq.gz --in2 ${scratch_dir}/../00-reads/@@_R2.fastq.gz --thread 5 --cut_front --cut_tail --cut_mean_quality 15 --qualified_quality_phred 15 --trim_poly_x --length_required 50 --detect_adapter_for_pe --json ${scratch_dir}/@@/@@_fastp.json --html ${scratch_dir}/@@/@@_fastp.html --out1 ${scratch_dir}/@@/@@_R1_filtered.fastq.gz --out2 ${scratch_dir}/@@/@@_R2_filtered.fastq.gz --unpaired1 ${scratch_dir}/@@/@@_R1_unpaired.fastq.gz --unpaired2 ${scratch_dir}/@@/@@_R2_unpaired.fastq.gz &" > _01_fastp.sh
+
+    echo -e "\e[32mFile _01_fastp.sh ready.\e[0m"
+
+  fi
\ No newline at end of file

From 92ce0c085883d021969224d37bab36669fe6e53b Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 16:04:32 +0200
Subject: [PATCH 033/321] Removed not needed lines

---
 .../templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/lablog | 7 -------
 1 file changed, 7 deletions(-)

diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/lablog
index 3c03fe884..1b53edc41 100644
--- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/lablog
+++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/lablog
@@ -1,10 +1,3 @@
-mkdir 01-fastqc
-mkdir 02-preprocessing
-mkdir 03-preprocQC
-mkdir 04-snippy
-mkdir 05-iqtree
-mkdir 99-stats
-
 ln -s ../samples_id.txt .
 ln -s ../00-reads .
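Because the reworked lablogs above build their links from globs, a path mismatch with the bacass output produces dangling symlinks rather than an error. A small sanity check one could run afterwards from inside the 02-preprocessing/ (or 01-preprocessing/) folder (a sketch under that assumption, not part of the templates):

```bash
#!/usr/bin/env bash
# Flag any sample link whose fastp target does not actually exist.
# [ -e ] follows symlinks, so it is false for a dangling link.
while read -r sample; do
  for link in "${sample}/${sample}_R1_filtered.fastq.gz" "${sample}/${sample}_R2_filtered.fastq.gz"; do
    [ -e "$link" ] || echo "WARNING: broken link: $link"
  done
done < ../samples_id.txt
```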
From 3e373ac35c254915e928fadb9b33863aade2bd3a Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 16:28:04 +0200
Subject: [PATCH 034/321] Corrected path to phylo.aln file in iqtree lablog

---
 .../snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog
index 95a2c4830..e351131c1 100644
--- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog
+++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog
@@ -2,5 +2,5 @@ scratch_dir=$(echo $PWD | sed 's/\/data\/bi\/scratch_tmp/\/scratch/g')
 
 mkdir logs
 
-#echo "srun --chdir \${scratch_dir} --output logs/IQTREEMFP.%j.log --job-name IQTREEMFP --cpus-per-task 20 --mem 5G --partition short_idx --time 00:30:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../07-snphylo/snphylo.output.fasta -m MFP &" > _00_iqtreemfp.sh
-echo "srun --chdir ${scratch_dir} --output logs/IQTREEFULLALIGN.%j.log --job-name IQTREEFULLALIGN --cpus-per-task 20 --mem 15G --partition short_idx --time 08:00:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../07-snphylo/snphylo.output.fasta -m PMB+F+R2 -T 20 -B 1000 -pre phylo.iqtree.bootstrap &" > _01_iqtreeall.sh
+#echo "srun --chdir \${scratch_dir} --output logs/IQTREEMFP.%j.log --job-name IQTREEMFP --cpus-per-task 20 --mem 5G --partition short_idx --time 00:30:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../04-snippy/phylo.aln -m MFP &" > _00_iqtreemfp.sh
+echo "srun --chdir ${scratch_dir} --output logs/IQTREEFULLALIGN.%j.log --job-name IQTREEFULLALIGN --cpus-per-task 20 --mem 15G --partition short_idx --time 08:00:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../04-snippy/phylo.aln -m PMB+F+R2 -T 20 -B 1000 -pre phylo.iqtree.bootstrap &" > _01_iqtreeall.sh

From d1611ccf0d8ca039b0fb2a30f320b5f164e74353 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 13 Jun 2024 16:34:36 +0200
Subject: [PATCH 035/321] Updated Changelog

---
 CHANGELOG.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 41f02fae5..f956ef2e7 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -46,7 +46,7 @@ Code contributions to the new version:
 - Updated sarek version in exomeeb, exometrio and wgstrio templates [#277](https://github.com/BU-ISCIII/buisciii-tools/pull/277)
 - Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278)
 - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
-- Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282)
+- Updated characterization and snippy templates to fit bacass pipeline. Corrected path in 05-iqtree in snippy template. [#283](https://github.com/BU-ISCIII/buisciii-tools/pull/283)
 
 ### Modules

From 730489fce7e4c3a488565b0bb25514bc267a4a85 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Fri, 17 May 2024 15:39:37 +0200
Subject: [PATCH 036/321] Created RESULTS/lablog files where needed so that
 multiqc_report.html is included in the RESULTS folder

---
 .../lowfreq_panel/RESULTS/lablog_lowfreq_panel_results     | 9 +++++++++
 .../mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results | 9 +++++++++
 bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results   | 9 +++++++++
 3 files changed, 27 insertions(+)
 create mode 100644 bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results
 create mode 100644 bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results
 create mode 100644 bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results

diff --git a/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results b/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results
new file mode 100644
index 000000000..cf16f5308
--- /dev/null
+++ b/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results
@@ -0,0 +1,9 @@
+DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega"
+
+mkdir $DELIVERY_FOLDER
+
+# Lowfreq_panel service
+cd $DELIVERY_FOLDER
+
+# Links to reports
+ln -s ../../../ANALYSIS/*RBPANEL/99-stats/multiqc_report.html .
diff --git a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results
new file mode 100644
index 000000000..3e60aec88
--- /dev/null
+++ b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results
@@ -0,0 +1,9 @@
+DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega"
+
+mkdir $DELIVERY_FOLDER
+
+# Assembly service
+cd $DELIVERY_FOLDER
+
+# Links to reports
+ln -s ../../../ANALYSIS/*ASSEMBLY/99-stats/MultiQC/multiqc_report.html .
diff --git a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results
new file mode 100644
index 000000000..55199d71e
--- /dev/null
+++ b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results
@@ -0,0 +1,9 @@
+DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega"
+
+mkdir $DELIVERY_FOLDER
+
+# Assembly service
+cd $DELIVERY_FOLDER
+
+# Links to reports
+ln -s ../../../ANALYSIS/*RNASEQ/*rnaseq/multiqc/star_salmon/multiqc_report.html .
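The `../../../ANALYSIS/...` targets in these new lablogs are trimmed to `../../ANALYSIS/...` in a follow-up patch below; the underlying rule is that a relative symlink target is resolved from the directory containing the link, not from wherever `ln -s` was invoked. A toy reproduction, with hypothetical folder names:

```bash
#!/usr/bin/env bash
# From inside RESULTS/<date>_entrega/, the service root is two levels up.
mkdir -p service/ANALYSIS/DEMO service/RESULTS/20240614_entrega
cd service/RESULTS/20240614_entrega
ln -s ../../ANALYSIS/DEMO ok_link      # two levels up: resolves
ln -s ../../../ANALYSIS/DEMO bad_link  # three levels up: escapes the service root
ls -L ok_link > /dev/null && echo "ok_link resolves"
ls -L bad_link 2> /dev/null || echo "bad_link is dangling"
```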
From c0043ae975ab63a2549b75913d6b6e7d2670c172 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Fri, 17 May 2024 15:44:10 +0200 Subject: [PATCH 037/321] Updated RESULTS/lablog files --- .../mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results | 2 +- bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results index 3e60aec88..07babd5a3 100644 --- a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results +++ b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results @@ -2,7 +2,7 @@ DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega" mkdir $DELIVERY_FOLDER -# Assembly service +# MTBSEQ-ASSEMBLY service cd $DELIVERY_FOLDER # Links to reports diff --git a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results index 55199d71e..e05201ead 100644 --- a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results +++ b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results @@ -2,7 +2,7 @@ DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega" mkdir $DELIVERY_FOLDER -# Assembly service +# RNASEQ service cd $DELIVERY_FOLDER # Links to reports From 9cf3c173434b63d085b923cb48a5af08c70f4896 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Fri, 14 Jun 2024 15:46:51 +0200 Subject: [PATCH 038/321] Updated CHANGELOG.md --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index f956ef2e7..7a728ca18 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -47,7 +47,7 @@ Code contributions to the new version: - Extension file of all_samples_virus_table_filtered (from csv to tsv) in lablog_viralrecon_results changed [#278](https://github.com/BU-ISCIII/buisciii-tools/pull/278) - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282) - Updated characterization and snippy templates to fit bacass pipeline. Corrected path in 05-iqtree in snippy template. [#283](https://github.com/BU-ISCIII/buisciii-tools/pull/283) - +- Included multiqc_report.html in RESULTS folder in every service, where necessary [#265](https://github.com/BU-ISCIII/buisciii-tools/pull/265) ### Modules From b1dc18fcb5b6f2749b0a7bd10b6f8e344c49ce27 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 17 Jun 2024 11:14:38 +0200 Subject: [PATCH 039/321] Fixed paths for symlink creation --- .../lowfreq_panel/RESULTS/lablog_lowfreq_panel_results | 2 +- .../mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results | 2 +- bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results b/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results index cf16f5308..6f41d3987 100644 --- a/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results +++ b/bu_isciii/templates/lowfreq_panel/RESULTS/lablog_lowfreq_panel_results @@ -6,4 +6,4 @@ mkdir $DELIVERY_FOLDER cd $DELIVERY_FOLDER # Links to reports -ln -s ../../../ANALYSIS/*RBPANEL/99-stats/multiqc_report.html . +ln -s ../../ANALYSIS/*RBPANEL/99-stats/multiqc_report.html .
diff --git a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results index 07babd5a3..d2bf377f2 100644 --- a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results +++ b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results @@ -6,4 +6,4 @@ mkdir $DELIVERY_FOLDER cd $DELIVERY_FOLDER # Links to reports -ln -s ../../../ANALYSIS/*ASSEMBLY/99-stats/MultiQC/multiqc_report.html . +ln -s ../../ANALYSIS/*ASSEMBLY/99-stats/MultiQC/multiqc_report.html . diff --git a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results index e05201ead..caa8f8684 100644 --- a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results +++ b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results @@ -6,4 +6,4 @@ mkdir $DELIVERY_FOLDER cd $DELIVERY_FOLDER # Links to reports -ln -s ../../../ANALYSIS/*RNASEQ/*rnaseq/multiqc/star_salmon/multiqc_report.html . +ln -s ../../ANALYSIS/*RNASEQ/*rnaseq/multiqc/star_salmon/multiqc_report.html . From 819d3d2b6fdf2650faa78bb1f656627d65543314 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 18 Jun 2024 10:20:13 +0200 Subject: [PATCH 040/321] Modified viralrecon results lablog to make symlinks to the /*_mapping/multiqc/ html reports --- bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results | 1 + 1 file changed, 1 insertion(+) diff --git a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results index d229644b9..4e691b91a 100755 --- a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results +++ b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results @@ -20,6 +20,7 @@ cat references.tmp | while read in; do cd excel_files_${in}; ln -s ../../../ANAL #Create symbolic links to files that are going to be converted to excel cat references.tmp | while read in; do ln -s ../../ANALYSIS/*/*${in}*/variants/ivar/variants_long_table.csv ${in}_variants_long_table.csv; done +for ref in $(cut -f2 ../../ANALYSIS/samples_ref.txt | sort | uniq); do for organism in $(cut -f3 ../../ANALYSIS/samples_ref.txt | tr '[:lower:]' '[:upper:]' | sort | uniq); do report="../../ANALYSIS/*_${organism}/${ref}_*_viralrecon_mapping/multiqc/multiqc_report.html"; if [ -e $report ]; then ln -s ${report} ./multiqc_report_${ref}_${organism}.html; fi; done; done ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html ln -s ../../ANALYSIS/*/mapping_illumina*.tab ./mapping_illumina.csv ln -s ../../ANALYSIS/*/assembly_stats.csv ./assembly_stats.csv From 4a10dca3674084dce97d0d3867e638a0f93b589d Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 18 Jun 2024 13:02:46 +0200 Subject: [PATCH 041/321] Completed rnaseq results lablog --- .../templates/rnaseq/RESULTS/lablog_rnaseq_results | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results index caa8f8684..c6c075df8 100644 --- a/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results +++ b/bu_isciii/templates/rnaseq/RESULTS/lablog_rnaseq_results @@ -5,5 +5,15 @@ mkdir $DELIVERY_FOLDER # RNASEQ service cd $DELIVERY_FOLDER -# Links to reports +# Links to multiqc reports ln -s ../../ANALYSIS/*RNASEQ/*rnaseq/multiqc/star_salmon/multiqc_report.html . 
+ +# Links to differential expression folders +# REMINDER: please make sure that subfolders within /*_DIFFERENTIAL_EXPRESSION/ follow the structure [number]_*. +# Otherwise, change the following command so that symlinks are created correctly. +# Check this path: /ANALYSIS/[DATE]_ANALYSIS0X_DIFFERENTIAL_EXPRESSION/ to see the names of the folders +ln -s ../../ANALYSIS/*_DIFFERENTIAL_EXPRESSION/[0-9]*_* . + +# Links to counts files +ln -s ../../ANALYSIS/*_RNASEQ/*_rnaseq/star_salmon/salmon.merged.gene_counts.tsv . +ln -s ../../ANALYSIS/*_RNASEQ/02-differential_expression/99-stats/normalized_expression.csv . From 450fadbd1f9472441253574584a97dc2c842ff20 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 18 Jun 2024 13:08:06 +0200 Subject: [PATCH 042/321] Modified viralrecon results lablog --- .../templates/viralrecon/RESULTS/lablog_viralrecon_results | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results index 4e691b91a..d7363bd2d 100755 --- a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results +++ b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results @@ -20,7 +20,7 @@ cat references.tmp | while read in; do cd excel_files_${in}; ln -s ../../../ANAL #Create symbolic links to files that are going to be converted to excel cat references.tmp | while read in; do ln -s ../../ANALYSIS/*/*${in}*/variants/ivar/variants_long_table.csv ${in}_variants_long_table.csv; done -for ref in $(cut -f2 ../../ANALYSIS/samples_ref.txt | sort | uniq); do for organism in $(cut -f3 ../../ANALYSIS/samples_ref.txt | tr '[:lower:]' '[:upper:]' | sort | uniq); do report="../../ANALYSIS/*_${organism}/${ref}_*_viralrecon_mapping/multiqc/multiqc_report.html"; if [ -e $report ]; then ln -s ${report} ./multiqc_report_${ref}_${organism}.html; fi; done; done +for ref in $(cut -f2 ../../ANALYSIS/samples_ref.txt | sort | uniq); do for organism in $(cut -f3 ../../ANALYSIS/samples_ref.txt | tr '[:lower:]' '[:upper:]' | sort | uniq); do report="../../ANALYSIS/*_${organism}/${ref}_*_viralrecon_mapping/multiqc/multiqc_report.html"; if [ -e $report ]; then ln -s ${report} ./multiqc_report_${ref}_${organism}.html; else echo "Multiqc report not found for reference $reference and organism $organism"; fi; done; done ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html ln -s ../../ANALYSIS/*/mapping_illumina*.tab ./mapping_illumina.csv ln -s ../../ANALYSIS/*/assembly_stats.csv ./assembly_stats.csv From 942adad65341e2e3913bfde9556277484b31d5a5 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 18 Jun 2024 13:12:13 +0200 Subject: [PATCH 043/321] Fixed minor mistake in viralrecon results lablog --- .../templates/viralrecon/RESULTS/lablog_viralrecon_results | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results index d7363bd2d..a46faba6b 100755 --- a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results +++ b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results @@ -20,7 +20,7 @@ cat references.tmp | while read in; do cd excel_files_${in}; ln -s ../../../ANAL #Create symbolic links to files that are going to be converted to excel cat references.tmp | while read in; do ln -s ../../ANALYSIS/*/*${in}*/variants/ivar/variants_long_table.csv ${in}_variants_long_table.csv; done -for ref in $(cut -f2 
../../ANALYSIS/samples_ref.txt | sort | uniq); do for organism in $(cut -f3 ../../ANALYSIS/samples_ref.txt | tr '[:lower:]' '[:upper:]' | sort | uniq); do report="../../ANALYSIS/*_${organism}/${ref}_*_viralrecon_mapping/multiqc/multiqc_report.html"; if [ -e $report ]; then ln -s ${report} ./multiqc_report_${ref}_${organism}.html; else echo "Multiqc report not found for reference $reference and organism $organism"; fi; done; done +for ref in $(cut -f2 ../../ANALYSIS/samples_ref.txt | sort | uniq); do for organism in $(cut -f3 ../../ANALYSIS/samples_ref.txt | tr '[:lower:]' '[:upper:]' | sort | uniq); do report="../../ANALYSIS/*_${organism}/${ref}_*_viralrecon_mapping/multiqc/multiqc_report.html"; if [ -e $report ]; then ln -s ${report} ./multiqc_report_${ref}_${organism}.html; else echo "Multiqc report not found for reference $ref and organism $organism"; fi; done; done ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html ln -s ../../ANALYSIS/*/mapping_illumina*.tab ./mapping_illumina.csv ln -s ../../ANALYSIS/*/assembly_stats.csv ./assembly_stats.csv From d9077ca96aa531f16d4775ebf82e3398b2a50ba1 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 29 Apr 2024 12:58:11 +0200 Subject: [PATCH 044/321] Modified bioinfo_doc.py so that new lines are applied when creating the .pdf file --- bu_isciii/bioinfo_doc.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py index b598f344b..4ef4f80f2 100755 --- a/bu_isciii/bioinfo_doc.py +++ b/bu_isciii/bioinfo_doc.py @@ -290,7 +290,7 @@ def post_delivery_info(self): if self.provided_txt: with open(os.path.expanduser(self.provided_txt)) as f: - self.delivery_notes = " ".join([x.strip() for x in f.readlines()]) + self.delivery_notes = "\n".join([x.strip() for x in f.readlines()]) else: self.delivery_notes = bu_isciii.utils.ask_for_some_text( msg="Write some delivery notes:" From 951daa9e8f340fbee05df6a087253f880ae0a803 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 29 Apr 2024 13:16:28 +0200 Subject: [PATCH 045/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 7a728ca18..3d378aa4b 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -61,6 +61,7 @@ Code contributions to the new version: - Fixed archive module. Updated correct header for scout tsv [#258](https://github.com/BU-ISCIII/buisciii-tools/pull/258). - Fixed clean module. Corrected purge_files function. Renaming stage moved from clean to rename_nocopy option. Updated services.json file with correct paths for some services. [#280](https://github.com/BU-ISCIII/buisciii-tools/pull/280) - Fixed autoclean-sftp function. [#281](https://github.com/BU-ISCIII/buisciii-tools/pull/281) +- Fixed bioinfo_doc.py. Modified it so that this module creates a .pdf file including new-line characters, without merging lines into one single line [#259](https://github.com/BU-ISCIII/buisciii-tools/pull/259). 
#### Changed From d864debb3046593b2a5b44fbaa3aae032d8abf25 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 25 Jun 2024 10:37:19 +0200 Subject: [PATCH 046/321] New attempt: added the nl2br markdown extension --- bu_isciii/bioinfo_doc.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py index 4ef4f80f2..37c95eec1 100755 --- a/bu_isciii/bioinfo_doc.py +++ b/bu_isciii/bioinfo_doc.py @@ -290,7 +290,7 @@ def post_delivery_info(self): if self.provided_txt: with open(os.path.expanduser(self.provided_txt)) as f: - self.delivery_notes = "\n".join([x.strip() for x in f.readlines()]) + self.delivery_notes = f.read() else: self.delivery_notes = bu_isciii.utils.ask_for_some_text( msg="Write some delivery notes:" @@ -388,6 +388,7 @@ def convert_markdown_to_html(self, mk_text): "pymdownx.highlight", "pymdownx.emoji", "pymdownx.tilde", + "nl2br", ], extension_configs={ "pymdownx.b64": { From c8497ef5437934d46323f2d13c40cad894f4504e Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 25 Jun 2024 11:01:37 +0200 Subject: [PATCH 047/321] Fixed linting mistake --- bu_isciii/bioinfo_doc.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py index 37c95eec1..a66ecd282 100755 --- a/bu_isciii/bioinfo_doc.py +++ b/bu_isciii/bioinfo_doc.py @@ -388,7 +388,7 @@ def convert_markdown_to_html(self, mk_text): "pymdownx.highlight", "pymdownx.emoji", "pymdownx.tilde", - "nl2br", + "nl2br", ], extension_configs={ "pymdownx.b64": { From 08ad531cc3808fa9a7f6830ad82dd806db7f7f5d Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 21 Jun 2024 14:07:21 +0200 Subject: [PATCH 048/321] Created mag template --- .../ANALYSIS/ANALYSIS02_MAG/99-stats/lablog | 25 ++++++++++++++++ .../99-stats/multiqc_config.yaml | 13 ++++++++ .../mag/ANALYSIS/ANALYSIS02_MAG/lablog | 30 +++++++++++++++++++ bu_isciii/templates/mag/ANALYSIS/lablog_mag | 1 + bu_isciii/templates/mag/DOC/mag.config | 19 ++++++++++++ bu_isciii/templates/mag/RAW/README | 1 + bu_isciii/templates/mag/REFERENCES/README | 1 + .../templates/mag/RESULTS/lablog_mag_results | 6 ++++ bu_isciii/templates/mag/TMP/README | 1 + bu_isciii/templates/services.json | 2 +- 10 files changed, 98 insertions(+), 1 deletion(-) create mode 100644 bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog create mode 100644 bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/multiqc_config.yaml create mode 100644 bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog create mode 100644 bu_isciii/templates/mag/ANALYSIS/lablog_mag create mode 100644 bu_isciii/templates/mag/DOC/mag.config create mode 100644 bu_isciii/templates/mag/RAW/README create mode 100644 bu_isciii/templates/mag/REFERENCES/README create mode 100755 bu_isciii/templates/mag/RESULTS/lablog_mag_results create mode 100644 bu_isciii/templates/mag/TMP/README diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog new file mode 100644 index 000000000..246dae5d4 --- /dev/null +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog @@ -0,0 +1,25 @@ +#module load singularity + +cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/kraken2_report.txt ./${in}_kraken2_report.txt; done + +scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") + +cat < multiqc.sbatch +#!/bin/sh +#SBATCH --ntasks 1 +#SBATCH --cpus-per-task 2 +#SBATCH --mem 4G +#SBATCH --time 
00:30:00 +#SBATCH --partition short_idx +#SBATCH --output $(date '+%Y%m%d')_multiqc.log +#SBATCH --chdir $scratch_dir + +export NXF_OPTS="-Xms500M -Xmx4G" + +singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/multiqc:1.9--py_1 multiqc -d . --config multiqc_config.yaml + +EOF + +echo "sbatch multiqc.sbatch" > _01_run_multiqc.sh + +echo "find -type l | while read in; do unlink \${in}; done" > _02_unlink.sh diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/multiqc_config.yaml b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/multiqc_config.yaml new file mode 100644 index 000000000..96b7e6136 --- /dev/null +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/multiqc_config.yaml @@ -0,0 +1,13 @@ +extra_fn_clean_exts: + - _R1 + - _R2 + - .R1 + - .R2 + - .sort + - _sort + - .stats + - _bamstat + - _align + - .txt +report_comment: > + This report has been generated by BU-ISCIII diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog new file mode 100644 index 000000000..39408a717 --- /dev/null +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog @@ -0,0 +1,30 @@ +ln -s ../00-reads . +ln -s ../samples_id.txt . + +#module load Nextflow +#module load singularity + +scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") + +cat < mag.sbatch +#!/bin/sh +#SBATCH --ntasks 1 +#SBATCH --cpus-per-task 2 +#SBATCH --mem 4G +#SBATCH --time 2:00:00 +#SBATCH --partition middle_idx +#SBATCH --output $(date '+%Y%m%d')_mag.log +#SBATCH --chdir $scratch_dir + +export NXF_OPTS="-Xms500M -Xmx4G" + +nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.1.1/workflow/main.nf \\ + -c ../../DOC/mag.config \\ + --input '00-reads/*_R{1,2}.fastq.gz' \\ + --outdir $(date '+%Y%m%d')_mag \\ + --kraken2_db /data/bi/references/kraken/minikraken_8GB_20200312.tgz \\ + --skip_busco --skip_spades --skip_spadeshybrid --skip_megahit --skip_prodigal --skip_binning \\ + -resume +EOF + +echo "sbatch mag.sbatch" > _01_run_mag.sh diff --git a/bu_isciii/templates/mag/ANALYSIS/lablog_mag b/bu_isciii/templates/mag/ANALYSIS/lablog_mag new file mode 100644 index 000000000..5076f4425 --- /dev/null +++ b/bu_isciii/templates/mag/ANALYSIS/lablog_mag @@ -0,0 +1 @@ +mv ANALYSIS02_MAG $(date '+%Y%m%d')_ANALYSIS02_MAG diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config new file mode 100644 index 000000000..732980bf1 --- /dev/null +++ b/bu_isciii/templates/mag/DOC/mag.config @@ -0,0 +1,19 @@ +singularity { + enabled = true + autoMounts = true +} + +process { + executor = 'slurm' + queue = 'middle_idx' + queue = 'middle_idx' + errorStrategy = { task.exitStatus in [140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 
'ignore' : 'finish' } + maxRetries = 1 + maxErrors = '-1' +} + +params { + max_memory = 376.GB + max_cpus = 32 + max_time = '48.h' +} diff --git a/bu_isciii/templates/mag/RAW/README b/bu_isciii/templates/mag/RAW/README new file mode 100644 index 000000000..a774e7bb8 --- /dev/null +++ b/bu_isciii/templates/mag/RAW/README @@ -0,0 +1 @@ +##Folder to hold raw reads to analyze in the service diff --git a/bu_isciii/templates/mag/REFERENCES/README b/bu_isciii/templates/mag/REFERENCES/README new file mode 100644 index 000000000..3ce2a2815 --- /dev/null +++ b/bu_isciii/templates/mag/REFERENCES/README @@ -0,0 +1 @@ +##Folder to hold references of the service diff --git a/bu_isciii/templates/mag/RESULTS/lablog_mag_results b/bu_isciii/templates/mag/RESULTS/lablog_mag_results new file mode 100755 index 000000000..55bc4c0e5 --- /dev/null +++ b/bu_isciii/templates/mag/RESULTS/lablog_mag_results @@ -0,0 +1,6 @@ +mkdir $(date '+%Y%m%d')_entrega01 +cd $(date '+%Y%m%d')_entrega01 + +#Create symbolic links depending on the analysis +#Individual files +ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html diff --git a/bu_isciii/templates/mag/TMP/README b/bu_isciii/templates/mag/TMP/README new file mode 100644 index 000000000..ba3229456 --- /dev/null +++ b/bu_isciii/templates/mag/TMP/README @@ -0,0 +1 @@ +##Folder to hold temporary files diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index bb88dfafb..7463cd5c4 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -222,7 +222,7 @@ }, "mag_met": { "label": "", - "template": "mag_met", + "template": "mag", "order": 2, "begin": "base", "end": "", From 550609d7375d75f5333dcfd01a012eb20660fe2a Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 21 Jun 2024 15:53:09 +0200 Subject: [PATCH 049/321] removed mag from other templates --- .../ANALYSIS/ANALYSIS02_MET/99-stats/lablog | 25 ---------------- .../99-stats/multiqc_config.yaml | 13 -------- .../IRMA/ANALYSIS/ANALYSIS02_MET/lablog | 30 ------------------- bu_isciii/templates/IRMA/ANALYSIS/lablog_irma | 1 - bu_isciii/templates/IRMA/DOC/mag.config | 19 ------------ .../IRMA/RESULTS/lablog_irma_results | 1 - .../DATE_ANALYSIS0X_MAG/99-stats/lablog | 27 ----------------- .../ANALYSIS/DATE_ANALYSIS0X_MAG/lablog | 30 ------------------- .../viralrecon/ANALYSIS/lablog_viralrecon | 1 - bu_isciii/templates/viralrecon/DOC/mag.config | 19 ------------ .../viralrecon/DOC/multiqc_config.yml | 13 -------- .../RESULTS/lablog_viralrecon_results | 1 - 12 files changed, 180 deletions(-) delete mode 100644 bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/lablog delete mode 100644 bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/multiqc_config.yaml delete mode 100644 bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/lablog delete mode 100644 bu_isciii/templates/IRMA/DOC/mag.config delete mode 100644 bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/99-stats/lablog delete mode 100644 bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/lablog delete mode 100644 bu_isciii/templates/viralrecon/DOC/mag.config delete mode 100644 bu_isciii/templates/viralrecon/DOC/multiqc_config.yml diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/lablog b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/lablog deleted file mode 100644 index 246dae5d4..000000000 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/lablog +++ /dev/null @@ -1,25 +0,0 @@ -#module load singularity - -cat 
../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/kraken2_report.txt ./${in}_kraken2_report.txt; done - -scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") - -cat < multiqc.sbatch -#!/bin/sh -#SBATCH --ntasks 1 -#SBATCH --cpus-per-task 2 -#SBATCH --mem 4G -#SBATCH --time 00:30:00 -#SBATCH --partition short_idx -#SBATCH --output $(date '+%Y%m%d')_multiqc.log -#SBATCH --chdir $scratch_dir - -export NXF_OPTS="-Xms500M -Xmx4G" - -singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/multiqc:1.9--py_1 multiqc -d . --config multiqc_config.yaml - -EOF - -echo "sbatch multiqc.sbatch" > _01_run_multiqc.sh - -echo "find -type l | while read in; do unlink \${in}; done" > _02_unlink.sh diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/multiqc_config.yaml b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/multiqc_config.yaml deleted file mode 100644 index 96b7e6136..000000000 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/99-stats/multiqc_config.yaml +++ /dev/null @@ -1,13 +0,0 @@ -extra_fn_clean_exts: - - _R1 - - _R2 - - .R1 - - .R2 - - .sort - - _sort - - .stats - - _bamstat - - _align - - .txt -report_comment: > - This report has been generated by BU-ISCIII diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/lablog b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/lablog deleted file mode 100644 index 21e0456ac..000000000 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS02_MET/lablog +++ /dev/null @@ -1,30 +0,0 @@ -ln -s ../00-reads . -ln -s ../samples_id.txt . - -#module load Nextflow -#module load singularity - -scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") - -cat < mag.sbatch -#!/bin/sh -#SBATCH --ntasks 1 -#SBATCH --cpus-per-task 2 -#SBATCH --mem 4G -#SBATCH --time 2:00:00 -#SBATCH --partition middle_idx -#SBATCH --output $(date '+%Y%m%d')_mag.log -#SBATCH --chdir $scratch_dir - -export NXF_OPTS="-Xms500M -Xmx4G" - -nextflow run /scratch/bi/pipelines/nf-core-mag-2.1.1/workflow/main.nf \\ - -c ../../DOC/mag.config \\ - --input '00-reads/*_R{1,2}.fastq.gz' \\ - --outdir $(date '+%Y%m%d')_mag \\ - --kraken2_db /data/bi/references/kraken/minikraken_8GB_20200312.tgz \\ - --skip_busco --skip_spades --skip_spadeshybrid --skip_megahit --skip_prodigal --skip_binning \\ - -resume -EOF - -echo "sbatch mag.sbatch" > _01_run_mag.sh diff --git a/bu_isciii/templates/IRMA/ANALYSIS/lablog_irma b/bu_isciii/templates/IRMA/ANALYSIS/lablog_irma index 3f99b6b0d..798ee5497 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/lablog_irma +++ b/bu_isciii/templates/IRMA/ANALYSIS/lablog_irma @@ -1,5 +1,4 @@ #ls ../RAW/* | tr '\/' '\t' | cut -f3 | cut -d "_" -f 1 | sort -u | grep -v "md5" > samples_id.txt mkdir -p 00-reads mv ANALYSIS01_FLU_IRMA $(date '+%Y%m%d')_ANALYSIS01_FLU_IRMA -mv ANALYSIS02_MET $(date '+%Y%m%d')_ANALYSIS02_MET cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd - \ No newline at end of file diff --git a/bu_isciii/templates/IRMA/DOC/mag.config b/bu_isciii/templates/IRMA/DOC/mag.config deleted file mode 100644 index 732980bf1..000000000 --- a/bu_isciii/templates/IRMA/DOC/mag.config +++ /dev/null @@ -1,19 +0,0 @@ -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - queue = 'middle_idx' - errorStrategy = { task.exitStatus in 
[140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 'ignore' : 'finish' } - maxRetries = 1 - maxErrors = '-1' -} - -params { - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/IRMA/RESULTS/lablog_irma_results b/bu_isciii/templates/IRMA/RESULTS/lablog_irma_results index eee33aa6a..5cb7c418d 100755 --- a/bu_isciii/templates/IRMA/RESULTS/lablog_irma_results +++ b/bu_isciii/templates/IRMA/RESULTS/lablog_irma_results @@ -3,7 +3,6 @@ cd $(date '+%Y%m%d')_entrega01 #Create symbolic links depending on the analysis #Individual files -ln -s ../../ANALYSIS/*_MET/99-stats/multiqc_report.html ./krona_results.html ln -s ../../ANALYSIS/*FLU_IRMA/04-irma/all_samples_completo.txt . ln -s ../../ANALYSIS/*FLU_IRMA/04-irma/A_H* . ln -s ../../ANALYSIS/*FLU_IRMA/04-irma/B . diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/99-stats/lablog b/bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/99-stats/lablog deleted file mode 100644 index 6685af52f..000000000 --- a/bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/99-stats/lablog +++ /dev/null @@ -1,27 +0,0 @@ -#module load singularity - -cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/kraken2_report.txt ./${in}_kraken2_report.txt; done - -scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") - -cat < multiqc.sbatch -#!/bin/sh -#SBATCH --ntasks 1 -#SBATCH --cpus-per-task 2 -#SBATCH --mem 4G -#SBATCH --time 00:30:00 -#SBATCH --partition short_idx -#SBATCH --output $(date '+%Y%m%d')_multiqc.log -#SBATCH --chdir $scratch_dir - -export NXF_OPTS="-Xms500M -Xmx4G" - -singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/multiqc:1.9--py_1 multiqc -d . --config multiqc_config.yaml - -EOF - -echo "sbatch multiqc.sbatch" > _01_run_multiqc.sh - -ln -s ../../../DOC/multiqc_config.yml . - -echo "find -type l | while read in; do unlink \${in}; done" > _02_unlink.sh diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/lablog b/bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/lablog deleted file mode 100644 index 83e293d6f..000000000 --- a/bu_isciii/templates/viralrecon/ANALYSIS/DATE_ANALYSIS0X_MAG/lablog +++ /dev/null @@ -1,30 +0,0 @@ -ln -s ../00-reads . -ln -s ../samples_id.txt . 
- -#module load Nextflow -#module load singularity - -scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") - -cat < mag.sbatch -#!/bin/sh -#SBATCH --ntasks 1 -#SBATCH --cpus-per-task 2 -#SBATCH --mem 4G -#SBATCH --time 2:00:00 -#SBATCH --partition middle_idx -#SBATCH --output $(date '+%Y%m%d')_mag.log -#SBATCH --chdir $scratch_dir - -export NXF_OPTS="-Xms500M -Xmx4G" - -nextflow run /data/bi/pipelines/nf-core-mag-2.1.1/workflow/main.nf \\ - -c ../../DOC/mag.config \\ - --input '00-reads/*_R{1,2}.fastq.gz' \\ - --outdir $(date '+%Y%m%d')_mag \\ - --kraken2_db /data/bi/references/kraken/minikraken_8GB_20200312.tgz \\ - --skip_busco --skip_spades --skip_spadeshybrid --skip_megahit --skip_prodigal --skip_binning \\ - -resume -EOF - -echo "sbatch mag.sbatch" > _01_run_mag.sh diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 916f3d7fb..f63925f21 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -401,7 +401,6 @@ rm create_summary_report.sh rm deduplicate_long_table.sh rm percentajeNs.py rm _02_create_run_percentage_Ns.sh -mv DATE_ANALYSIS0X_MAG $(date '+%Y%m%d')_ANALYSIS0X_MAG cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd .. echo_green "\nLablog_viralrecon execution has been completed successfully!" \ No newline at end of file diff --git a/bu_isciii/templates/viralrecon/DOC/mag.config b/bu_isciii/templates/viralrecon/DOC/mag.config deleted file mode 100644 index 732980bf1..000000000 --- a/bu_isciii/templates/viralrecon/DOC/mag.config +++ /dev/null @@ -1,19 +0,0 @@ -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - queue = 'middle_idx' - errorStrategy = { task.exitStatus in [140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 
'ignore' : 'finish' } - maxRetries = 1 - maxErrors = '-1' -} - -params { - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/viralrecon/DOC/multiqc_config.yml b/bu_isciii/templates/viralrecon/DOC/multiqc_config.yml deleted file mode 100644 index 96b7e6136..000000000 --- a/bu_isciii/templates/viralrecon/DOC/multiqc_config.yml +++ /dev/null @@ -1,13 +0,0 @@ -extra_fn_clean_exts: - - _R1 - - _R2 - - .R1 - - .R2 - - .sort - - _sort - - .stats - - _bamstat - - _align - - .txt -report_comment: > - This report has been generated by BU-ISCIII diff --git a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results index a46faba6b..d05b2ab77 100755 --- a/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results +++ b/bu_isciii/templates/viralrecon/RESULTS/lablog_viralrecon_results @@ -21,7 +21,6 @@ cat references.tmp | while read in; do cd excel_files_${in}; ln -s ../../../ANAL cat references.tmp | while read in; do ln -s ../../ANALYSIS/*/*${in}*/variants/ivar/variants_long_table.csv ${in}_variants_long_table.csv; done for ref in $(cut -f2 ../../ANALYSIS/samples_ref.txt | sort | uniq); do for organism in $(cut -f3 ../../ANALYSIS/samples_ref.txt | tr '[:lower:]' '[:upper:]' | sort | uniq); do report="../../ANALYSIS/*_${organism}/${ref}_*_viralrecon_mapping/multiqc/multiqc_report.html"; if [ -e $report ]; then ln -s ${report} ./multiqc_report_${ref}_${organism}.html; else echo "Multiqc report not found for reference $ref and organism $organism"; fi; done; done -ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html ln -s ../../ANALYSIS/*/mapping_illumina*.tab ./mapping_illumina.csv ln -s ../../ANALYSIS/*/assembly_stats.csv ./assembly_stats.csv ln -s ../../ANALYSIS/*/01-PikaVirus-results/all_samples_virus_table_filtered.tsv ./pikavirus_table.tsv From 9d8b08d26a853dc0cca4a21e16ed9be61a14cc9c Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 21 Jun 2024 15:54:13 +0200 Subject: [PATCH 050/321] Fixed new service to handle more than one service_id --- bu_isciii/new_service.py | 16 ++++++---------- 1 file changed, 6 insertions(+), 10 deletions(-) diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index cbbfe81ee..f3ab412bc 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -125,16 +125,19 @@ def copy_template(self): ) services_ids = bu_isciii.utils.get_service_ids(self.services_requested) services_json = bu_isciii.service_json.ServiceJson() - if len(services_ids) == 1: + for service_id in services_ids: try: - service_template = services_json.get_find(services_ids[0], "template") + service_template = services_json.get_find(service_id, "template") + service_end = services_json.get_find(service_id, "end") except KeyError as e: stderr.print( "[red]ERROR: Service id %s not found in services json file." - % services_ids[0] + % service_id ) stderr.print("traceback error %s" % e) sys.exit() + if service_end not in services_ids and service_end != '': + services_ids.append(service_end) try: shutil.copytree( os.path.join( @@ -153,13 +156,6 @@ def copy_template(self): stderr.print("[red]ERROR: Copying template failed.") stderr.print("traceback error %s" % e) sys.exit() - else: - stderr.print( - "[red] ERROR: I'm not already prepared for handling more than one error at the same time, sorry!" - "Please re-run and select one of the service ids." 
- ) - sys.exit(1) - return False return True def create_samples_id(self): From 681bbe64a6a93577fd8abe32802d865f357c78c9 Mon Sep 17 00:00:00 2001 From: svarona Date: Mon, 24 Jun 2024 09:03:11 +0200 Subject: [PATCH 051/321] moved the code to utils --- bu_isciii/new_service.py | 3 --- bu_isciii/utils.py | 14 ++++++++++++++ 2 files changed, 14 insertions(+), 3 deletions(-) diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index f3ab412bc..c775b928a 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -128,7 +128,6 @@ def copy_template(self): for service_id in services_ids: try: service_template = services_json.get_find(service_id, "template") - service_end = services_json.get_find(service_id, "end") except KeyError as e: stderr.print( "[red]ERROR: Service id %s not found in services json file." @@ -136,8 +135,6 @@ def copy_template(self): ) stderr.print("traceback error %s" % e) sys.exit() - if service_end not in services_ids and service_end != '': - services_ids.append(service_end) try: shutil.copytree( os.path.join( diff --git a/bu_isciii/utils.py b/bu_isciii/utils.py index 821210b3c..5408e7c72 100755 --- a/bu_isciii/utils.py +++ b/bu_isciii/utils.py @@ -6,6 +6,7 @@ import json import os import tarfile +import sys import questionary import rich @@ -167,6 +168,19 @@ def get_service_ids(services_requested): if services["service_id"] is not None: service_id_list.append(services["service_id"]) service_id_list_all.append(services["service_id"]) + services_json = bu_isciii.service_json.ServiceJson() + try: + service_end = services_json.get_find(services["service_id"], "end") + except KeyError as e: + stderr.print( + "[red]ERROR: Service id %s not found in services json file." + % services["service_id"] + ) + stderr.print("traceback error %s" % e) + sys.exit() + if service_end not in service_id_list and service_end != '': + service_id_list.append(service_end) + service_id_list_all.append(service_end) service_id_list_all.append("all") stderr.print("Which selected service do you want to manage?") services_sel = [prompt_selection("Service label:", service_id_list_all)] From f422a4728ee7b54d38d0030d807b3a3899347870 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 14:53:08 +0200 Subject: [PATCH 052/321] Fixed multiple service in clean module --- bu_isciii/clean.py | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/bu_isciii/clean.py b/bu_isciii/clean.py index 3dba081c0..63a42b8bc 100644 --- a/bu_isciii/clean.py +++ b/bu_isciii/clean.py @@ -129,10 +129,9 @@ def get_clean_items(self, services_ids, type="files"): for service in services_ids: try: items = service_conf.get_find_deep(service, type) - if len(clean_items_list) == 0 and len(items) > 0: - clean_items_list = items - elif len(items) > 0: - clean_items_list.append(items) + for item in items: + if item not in clean_items_list: + clean_items_list.append(item) except KeyError as e: stderr.print( "[red]ERROR: Service id %s not found in services json file." 
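Patches 050 and 051 change how a request is expanded: get_service_ids now looks up the requested service in services.json and, when its "end" key names a companion service, appends that companion to the list as well, so the companion's template is handled in the same run. A minimal sketch for inspecting that chain by hand — jq is not part of the tools, and the top-level layout of services.json (an object keyed by service id, as suggested by the snippet in patch 048) is an assumption:

service="mag_met"
# read the template and the chained "end" service for one service id
template=$(jq -r --arg s "$service" '.[$s].template' bu_isciii/templates/services.json)
end=$(jq -r --arg s "$service" '.[$s].end' bu_isciii/templates/services.json)
echo "service=${service} template=${template} end=${end:-none}"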
From 90df9e91fde9c87c47614e78ae153861bba2cd63 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 14:53:50 +0200 Subject: [PATCH 053/321] fixed multiple services in copy_sftp module --- bu_isciii/copy_sftp.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/bu_isciii/copy_sftp.py b/bu_isciii/copy_sftp.py index 0c1851424..cfd2b3890 100644 --- a/bu_isciii/copy_sftp.py +++ b/bu_isciii/copy_sftp.py @@ -112,8 +112,9 @@ def get_last_folders(self, services_ids, type="last_folder"): last_folders_list = [] for service in services_ids: try: - items = service_conf.get_find_deep(service, type) - last_folders_list.append(items) + item = service_conf.get_find_deep(service, type) + if item not in last_folders_list: + last_folders_list.append(item) except KeyError as e: stderr.print( "[red]ERROR: Service id %s not found in services json file." From b19358fb57e4507525e84f74755d47cc7ca7a802 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 16:51:18 +0200 Subject: [PATCH 054/321] Fixed variable name for stderr --- bu_isciii/new_service.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index c775b928a..eca0f8cd1 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -207,8 +207,8 @@ def create_symbolic_links(self): ) except OSError as e: stderr.print( - "[red]ERROR: Symbolic links creation failed for sample %s." - % sample["sampleName"] + "[red]ERROR: Symbolic links creation failed for file %s." + % file ) stderr.print("Traceback: %s" % e) sys.exit() From 21332741d3968155e31c1314b471e12cc73ba07d Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 16:51:50 +0200 Subject: [PATCH 055/321] Allow to continue after symb link error --- bu_isciii/new_service.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index eca0f8cd1..280061738 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -211,7 +211,7 @@ def create_symbolic_links(self): % file ) stderr.print("Traceback: %s" % e) - sys.exit() + continue def samples_json(self): json_samples = json.dumps(self.service_samples, indent=4) From 39de6de948e81651eacaf384488cd7716a196488 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 16:52:29 +0200 Subject: [PATCH 056/321] Avoid updating to in_progress when already in_progress --- bu_isciii/new_service.py | 23 +++++++++++++---------- 1 file changed, 13 insertions(+), 10 deletions(-) diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index 280061738..e0faaa5e8 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -230,9 +230,11 @@ def create_new_service(self): self.create_samples_id() self.create_symbolic_links() self.samples_json() - self.rest_api.put_request( - "update-state", "resolution", self.resolution_id, "state", "in_progress" - ) + if self.resolution_info["service_state"] != "in_progress": + self.rest_api.put_request( + "update-state", "resolution", self.resolution_id, "state", "in_progress" + ) + else: stderr.print( "[yellow]WARN: No samples recorded in service: " + self.resolution_id @@ -240,13 +242,14 @@ def create_new_service(self): if bu_isciii.utils.prompt_yn_question("Do you want to proceed?: "): self.create_folder() self.copy_template() - self.rest_api.put_request( - "update-state", - "resolution", - self.resolution_id, - "state", - "in_progress", - ) + if self.resolution_info["service_state"] != "in_progress": + 
self.rest_api.put_request( + "update-state", + "resolution", + self.resolution_id, + "state", + "in_progress", + ) else: stderr.print("Directory not created. Bye!") sys.exit(1) From 80f5df8b38a216ef348c558ccd9e0f366fd2413e Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 16:58:21 +0200 Subject: [PATCH 057/321] fixed black --- bu_isciii/new_service.py | 9 ++++++--- bu_isciii/utils.py | 2 +- 2 files changed, 7 insertions(+), 4 deletions(-) diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index e0faaa5e8..f57e301da 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -207,8 +207,7 @@ def create_symbolic_links(self): ) except OSError as e: stderr.print( - "[red]ERROR: Symbolic links creation failed for file %s." - % file + "[red]ERROR: Symbolic links creation failed for file %s." % file ) stderr.print("Traceback: %s" % e) @@ -232,7 +231,11 @@ def create_new_service(self): self.samples_json() if self.resolution_info["service_state"] != "in_progress": self.rest_api.put_request( - "update-state", "resolution", self.resolution_id, "state", "in_progress" + "update-state", + "resolution", + self.resolution_id, + "state", + "in_progress", ) else: diff --git a/bu_isciii/utils.py b/bu_isciii/utils.py index 5408e7c72..07ba82939 100755 --- a/bu_isciii/utils.py +++ b/bu_isciii/utils.py @@ -178,7 +178,7 @@ def get_service_ids(services_requested): ) stderr.print("traceback error %s" % e) sys.exit() - if service_end not in service_id_list and service_end != '': + if service_end not in service_id_list and service_end != "": service_id_list.append(service_end) service_id_list_all.append(service_end) From 9db234bdd2fe36858afbfd4faaabfcbffab79ca5 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 25 Jun 2024 17:44:34 +0200 Subject: [PATCH 058/321] Updated changelog --- CHANGELOG.md | 3 +++ 1 file changed, 3 insertions(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 3d378aa4b..f9a97e31a 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -48,6 +48,7 @@ Code contributions to the new version: - Fixed singularity-images path when updating pangolin database in lablog_viralrecon. Added line break after prompted input. [#282](https://github.com/BU-ISCIII/buisciii-tools/pull/282) - Updated characterization and snippy templates to fit bacass pipeline. Corrected path in 05-iqtree in snippy template. [#283](https://github.com/BU-ISCIII/buisciii-tools/pull/283) - Included multiqc_report.html in RESULTS folder in every service, where necessary [#265](https://github.com/BU-ISCIII/buisciii-tools/pull/265) +- Added MAG template and removed MAG from other templates [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288) ### Modules - PR [#274](https://github.com/BU-ISCIII/buisciii-tools/pull/274): added `--dev` option, configuration dev and test folder structure. - PR [#276](https://github.com/BU-ISCIII/buisciii-tools/pull/276): wkhtmlpdf does not need absolute path to executable. Added better error handling when executable does not exist. +- PR [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288) Allowed to handle more than one service at a time, related to issue [#217](https://github.com/BU-ISCIII/buisciii-tools/issues/217) #### Fixes - Fixed archive module. Updated correct header for scout tsv [#258](https://github.com/BU-ISCIII/buisciii-tools/pull/258). - Fixed clean module. Corrected purge_files function. Renaming stage moved from clean to rename_nocopy option. Updated services.json file with correct paths for some services.
[#280](https://github.com/BU-ISCIII/buisciii-tools/pull/280) - Fixed autoclean-sftp function. [#281](https://github.com/BU-ISCIII/buisciii-tools/pull/281) - Fixed bioinfo_doc.py. Modified it so that this module creates a .pdf file including new-line characters, without merging lines into one single line [#259](https://github.com/BU-ISCIII/buisciii-tools/pull/259). +- PR [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288) Fixed updating service's state to in_progress multiple times, related with issue [#285](https://github.com/BU-ISCIII/buisciii-tools/issues/285) #### Changed From 0c2fd23d99bbcd70f564137e27ba6085e9a3e89f Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 27 Jun 2024 09:10:40 +0200 Subject: [PATCH 059/321] Removed owner Pablo --- bu_isciii/config_json.py | 1 - bu_isciii/service_json.py | 1 - 2 files changed, 2 deletions(-) diff --git a/bu_isciii/config_json.py b/bu_isciii/config_json.py index cafad194b..5035ec938 100644 --- a/bu_isciii/config_json.py +++ b/bu_isciii/config_json.py @@ -24,7 +24,6 @@ def get_configuration(self, topic): def get_find(self, topic, found): """ - Owner: Pablo Description: Obtain from topic any forward items from json data """ diff --git a/bu_isciii/service_json.py b/bu_isciii/service_json.py index d9f2a280b..bbe8a1112 100644 --- a/bu_isciii/service_json.py +++ b/bu_isciii/service_json.py @@ -38,7 +38,6 @@ def get_service_configuration(self, service): def get_find(self, service, found): """ - Owner: Pablo Description: Obtain from service any forward items from json data """ From 236bec09108ee1989d70fad9f5adef127d1646ca Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 27 Jun 2024 10:28:23 +0200 Subject: [PATCH 060/321] Changed safe to True --- bu_isciii/archive.py | 4 ++-- bu_isciii/bioinfo_doc.py | 4 ++-- bu_isciii/clean.py | 2 +- bu_isciii/copy_sftp.py | 2 +- bu_isciii/new_service.py | 3 +-- bu_isciii/scratch.py | 2 +- 6 files changed, 8 insertions(+), 9 deletions(-) diff --git a/bu_isciii/archive.py b/bu_isciii/archive.py index 6d84f1610..d89f36e4b 100644 --- a/bu_isciii/archive.py +++ b/bu_isciii/archive.py @@ -224,7 +224,7 @@ def __init__( try: for service in rest_api.get_request( request_info="services", - safe=False, + safe=True, state="delivered", date_from=str(self.date_from), date_until=str(self.date_until), @@ -259,7 +259,7 @@ def __init__( if isinstance( ( service_data := rest_api.get_request( - request_info="service-data", safe=False, service=service + request_info="service-data", safe=True, service=service ) ), int, diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py index a66ecd282..5583ab8a8 100755 --- a/bu_isciii/bioinfo_doc.py +++ b/bu_isciii/bioinfo_doc.py @@ -77,7 +77,7 @@ def __init__( conf_api["server"], conf_api["api_url"], api_user, api_password ) self.resolution_info = self.rest_api.get_request( - request_info="service-data", safe=False, resolution=self.resolution_id + request_info="service-data", safe=True, resolution=self.resolution_id ) if self.resolution_info == 404: print("Received Error 404 from Iskylims API. 
Aborting") @@ -92,7 +92,7 @@ def __init__( else: self.post_delivery_info() self.resolution_info = self.rest_api.get_request( - request_info="service-data", safe=False, resolution=self.resolution_id + request_info="service-data", safe=True, resolution=self.resolution_id ) self.services_requested = self.resolution_info["resolutions"][0][ "available_services" diff --git a/bu_isciii/clean.py b/bu_isciii/clean.py index 63a42b8bc..6536c306a 100644 --- a/bu_isciii/clean.py +++ b/bu_isciii/clean.py @@ -47,7 +47,7 @@ def __init__( conf_api["server"], conf_api["api_url"], api_user, api_password ) self.resolution_info = rest_api.get_request( - request_info="service-data", safe=False, resolution=self.resolution_id + request_info="service-data", safe=True, resolution=self.resolution_id ) self.service_folder = self.resolution_info["resolutions"][0][ "resolution_full_number" diff --git a/bu_isciii/copy_sftp.py b/bu_isciii/copy_sftp.py index cfd2b3890..9474b59be 100644 --- a/bu_isciii/copy_sftp.py +++ b/bu_isciii/copy_sftp.py @@ -50,7 +50,7 @@ def __init__( ) self.resolution_info = rest_api.get_request( - request_info="service-data", safe=False, resolution=self.resolution_id + request_info="service-data", safe=True, resolution=self.resolution_id ) if sftp_folder is None: self.sftp_folder = bu_isciii.utils.get_sftp_folder( diff --git a/bu_isciii/new_service.py b/bu_isciii/new_service.py index f57e301da..0bcf65561 100755 --- a/bu_isciii/new_service.py +++ b/bu_isciii/new_service.py @@ -54,7 +54,7 @@ def __init__( conf_api["server"], conf_api["api_url"], api_user, api_password ) self.resolution_info = self.rest_api.get_request( - request_info="service-data", safe=False, resolution=self.resolution_id + request_info="service-data", safe=True, resolution=self.resolution_id ) self.service_folder = self.resolution_info["resolutions"][0][ "resolution_full_number" @@ -210,7 +210,6 @@ def create_symbolic_links(self): "[red]ERROR: Symbolic links creation failed for file %s." % file ) stderr.print("Traceback: %s" % e) - continue def samples_json(self): json_samples = json.dumps(self.service_samples, indent=4) diff --git a/bu_isciii/scratch.py b/bu_isciii/scratch.py index 9f2a9984f..d165c8e92 100755 --- a/bu_isciii/scratch.py +++ b/bu_isciii/scratch.py @@ -64,7 +64,7 @@ def __init__( self.conf = conf.get_configuration("scratch_copy") self.resolution_info = rest_api.get_request( - request_info="service-data", safe=False, resolution=self.resolution_id + request_info="service-data", safe=True, resolution=self.resolution_id ) self.service_folder = self.resolution_info["resolutions"][0][ "resolution_full_number" From bb50952036e477e66e257fe707c2e91639b041e8 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 27 Jun 2024 10:29:18 +0200 Subject: [PATCH 061/321] Fixed possible error when type does not exist in json --- bu_isciii/clean.py | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/bu_isciii/clean.py b/bu_isciii/clean.py index 6536c306a..dbc6625c5 100644 --- a/bu_isciii/clean.py +++ b/bu_isciii/clean.py @@ -129,9 +129,16 @@ def get_clean_items(self, services_ids, type="files"): for service in services_ids: try: items = service_conf.get_find_deep(service, type) - for item in items: - if item not in clean_items_list: - clean_items_list.append(item) + if items: + for item in items: + if item not in clean_items_list: + clean_items_list.append(item) + else: + stderr.print( + "[red]ERROR: Service type %s not found in services json file for service %s." 
+                        % (type,service)
+                    )
+                    sys.exit()
             except KeyError as e:
                 stderr.print(
                     "[red]ERROR: Service id %s not found in services json file."

From 387e4f48c3f3d40559de988f04923f8df25b3e32 Mon Sep 17 00:00:00 2001
From: svarona
Date: Thu, 27 Jun 2024 10:30:04 +0200
Subject: [PATCH 062/321] Fixed black

---
 bu_isciii/clean.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/clean.py b/bu_isciii/clean.py
index dbc6625c5..cc514628a 100644
--- a/bu_isciii/clean.py
+++ b/bu_isciii/clean.py
@@ -136,7 +136,7 @@ def get_clean_items(self, services_ids, type="files"):
                 else:
                     stderr.print(
                         "[red]ERROR: Service type %s not found in services json file for service %s."
-                        % (type,service)
+                        % (type, service)
                     )
                     sys.exit()
             except KeyError as e:

From d01ac11edb191940d439c0ea439bb30da634d3ec Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 26 Jun 2024 15:44:16 +0200
Subject: [PATCH 063/321] Created 03-armfinderplus and lablog

---
 .../ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog | 7 +++++++
 1 file changed, 7 insertions(+)
 create mode 100644 bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
new file mode 100644
index 000000000..7ef828b00
--- /dev/null
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
@@ -0,0 +1,7 @@
+# conda activate amrfinder
+
+# Only works with assemblies; prior to this you must have executed the assembly pipeline
+
+scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')
+
+cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism Clostridioides_difficile --name ${in} --plus -o ${in}_out &" >> _01_run_amrfinder.sh; done
\ No newline at end of file

From 4ac57c34cdafdea65f20cef5877b41d6207d5f12 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 26 Jun 2024 16:36:07 +0200
Subject: [PATCH 064/321] Added organism selection when lablog executed

---
 .../03-armfinderplus/lablog | 18 +++++++++++++++++-
 1 file changed, 17 insertions(+), 1 deletion(-)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
index 7ef828b00..19920152a 100644
--- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
@@ -4,4 +4,20 @@

 scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')

-cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism Clostridioides_difficile --name ${in} --plus -o ${in}_out &" >> _01_run_amrfinder.sh; done
\ No newline at end of file
+possible_organisms=("Acinetobacter_baumannii" "Burkholderia_cepacia" "Burkholderia_pseudomallei" "Campylobacter" "Citrobacter_freundii" "Clostridioides_difficile" "Enterobacter_asburiae" "Enterobacter_cloacae" "Enterococcus_faecalis" "Enterococcus_faecium" "Escherichia" "Klebsiella_oxytoca" "Klebsiella_pneumoniae" "Neisseria_gonorrhoeae" "Neisseria_meningitidis" "Pseudomonas_aeruginosa" "Salmonella" "Serratia_marcescens" "Staphylococcus_aureus" "Staphylococcus_pseudintermedius" "Streptococcus_agalactiae" "Streptococcus_pneumoniae" "Streptococcus_pyogenes" "Vibrio_cholerae" "Vibrio_parahaemolyticus" "Vibrio_vulnificus" "OTHER")
+
+echo "Please select your bacteria from the following list:"
+PS3=$(echo -e "\n\033[1;37mSelect number:\033[0m ")
+select bacteria in "${possible_organisms[@]}"; do
+    if [[ -n "$bacteria" ]]; then
+        echo -e "\033[0;32mOrganism selected: ${bacteria}\033[0m"
+        if [ $bacteria = "OTHER" ]; then
+            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --name ${in} --plus -o ${in}_out &" >> _01_run_amrfinder.sh; done
+        else
+            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism ${bacteria} --name ${in} --plus -o ${in}_out &" >> _01_run_amrfinder.sh; done
+        fi
+        break
+    else
+        echo -e "\n\033[0;31mInvalid input.\033[0m"
+    fi
+done
\ No newline at end of file

From 30cf68f8ebd53382c3e9ec24465a8b4a311fb9e6 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 26 Jun 2024 16:44:12 +0200
Subject: [PATCH 065/321] Added some format

---
 .../ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
index 19920152a..981b66fa6 100644
--- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
@@ -5,8 +5,8 @@
 scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')

 possible_organisms=("Acinetobacter_baumannii" "Burkholderia_cepacia" "Burkholderia_pseudomallei" "Campylobacter" "Citrobacter_freundii" "Clostridioides_difficile" "Enterobacter_asburiae" "Enterobacter_cloacae" "Enterococcus_faecalis" "Enterococcus_faecium" "Escherichia" "Klebsiella_oxytoca" "Klebsiella_pneumoniae" "Neisseria_gonorrhoeae" "Neisseria_meningitidis" "Pseudomonas_aeruginosa" "Salmonella" "Serratia_marcescens" "Staphylococcus_aureus" "Staphylococcus_pseudintermedius" "Streptococcus_agalactiae" "Streptococcus_pneumoniae" "Streptococcus_pyogenes" "Vibrio_cholerae" "Vibrio_parahaemolyticus" "Vibrio_vulnificus" "OTHER")
-
-echo "Please select your bacteria from the following list:"
+echo
+echo -e "\n\033[1;37mPlease select your bacteria from the following list:\033[0m"
 PS3=$(echo -e "\n\033[1;37mSelect number:\033[0m ")
 select bacteria in "${possible_organisms[@]}"; do
     if [[ -n "$bacteria" ]]; then

From a838fb8f577d98fce9c3f643a7000176ee68f977 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 26 Jun 2024 17:13:23 +0200
Subject: [PATCH 066/321] Modified lablog_characterization_results including amrfinderplus files

---
 .../RESULTS/lablog_characterization_results | 12 +++++++-----
 1 file changed, 7 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results
index 8879a843b..6a41c5703 100644
--- a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results
+++ b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results
@@ -1,12 +1,14 @@
-DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega"
+DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega01"

-mkdir -p $DELIVERY_FOLDER
-mkdir "${DELIVERY_FOLDER}/characterization"
+mkdir -p "${DELIVERY_FOLDER}/characterization/amrfinderplus"

 # ARIBA characterization service
 cd $DELIVERY_FOLDER/characterization
 ln -s ../../../ANALYSIS/*CHARACTERIZATION/99-stats/ariba_*.tsv .
 ln -s ../../../ANALYSIS/*CHARACTERIZATION/99-stats/ariba_*.csv .
-find . -xtype l -delete
-cd -
+cd amrfinderplus
+find ../../../../ANALYSIS/*CHARACTERIZATION/*amrfinderplus -name '*_out' -exec bash -c 'ln -s "$1" "$(basename "${1%_out}.tsv")"' _ {} \;
+find .. -xtype l -delete
+
+cd ../..

From 03d3e3ce275cd214baf54d74e3551a2363a93af8 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 26 Jun 2024 17:15:38 +0200
Subject: [PATCH 067/321] Renamed 03-amrfinderplus folder

---
 .../{03-armfinderplus => 03-amrfinderplus}/lablog | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/{03-armfinderplus => 03-amrfinderplus}/lablog (100%)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
similarity index 100%
rename from bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-armfinderplus/lablog
rename to bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog

From ebd448ede3b956c569d3ead94ebb7a84b79c9504 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 27 Jun 2024 13:28:49 +0200
Subject: [PATCH 068/321] Fixed changelog conflict

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index f9a97e31a..5aae27a46 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -49,6 +49,7 @@ Code contributions to the new version:
 - Updated characterization and snippy templates to fit bacass pipeline. Corrected path in 05-iqtree in snippy template. [#283](https://github.com/BU-ISCIII/buisciii-tools/pull/283)
 - Included multiqc_report.html in RESULTS folder in every service, where necessary [#265](https://github.com/BU-ISCIII/buisciii-tools/pull/265)
 - Added MAG template and removed MAG from other templates [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288)
+- Added amrfinderplus to characterization template. [#289](https://github.com/BU-ISCIII/buisciii-tools/pull/289)

 ### Modules

From d65b97727a46bbdfa688de5fe1d0d04f3af1d783 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 27 Jun 2024 09:12:53 +0200
Subject: [PATCH 069/321] Added tsv extension to output files for amrfinderplus

---
 .../ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
index 981b66fa6..a75150202 100644
--- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
@@ -12,9 +12,9 @@ select bacteria in "${possible_organisms[@]}"; do
     if [[ -n "$bacteria" ]]; then
         echo -e "\033[0;32mOrganism selected: ${bacteria}\033[0m"
         if [ $bacteria = "OTHER" ]; then
-            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --name ${in} --plus -o ${in}_out &" >> _01_run_amrfinder.sh; done
+            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --name ${in} --plus -o ${in}_out.tsv &" >> _01_run_amrfinder.sh; done
         else
-            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism ${bacteria} --name ${in} --plus -o ${in}_out &" >> _01_run_amrfinder.sh; done
+            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism ${bacteria} --name ${in} --plus -o ${in}_out.tsv &" >> _01_run_amrfinder.sh; done
         fi
         break
     else

From 4d44862110b5c45be2bfafd0a47c84f37ffb1ce2 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 27 Jun 2024 09:16:23 +0200
Subject: [PATCH 070/321] Modified lablog_characterization_results in order to create symlinks for tsv files in amrfinderplus analysis

---
 .../characterization/RESULTS/lablog_characterization_results | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results
index 6a41c5703..a12cfbd96 100644
--- a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results
+++ b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results
@@ -8,7 +8,7 @@
 ln -s ../../../ANALYSIS/*CHARACTERIZATION/99-stats/ariba_*.tsv .
 ln -s ../../../ANALYSIS/*CHARACTERIZATION/99-stats/ariba_*.csv .

 cd amrfinderplus
-find ../../../../ANALYSIS/*CHARACTERIZATION/*amrfinderplus -name '*_out' -exec bash -c 'ln -s "$1" "$(basename "${1%_out}.tsv")"' _ {} \;
+ln -s ../../../../ANALYSIS/*CHARACTERIZATION/*amrfinderplus/*tsv .
 find .. -xtype l -delete

 cd ../..
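The two lablog patches above settle on a single delivery idiom: create the delivery folder, symlink whatever the analysis actually produced, then prune any link whose target never materialized. A minimal bash sketch of the same pattern, using hypothetical analysis/ and delivery/ paths rather than the template's real ones:

    # create the per-tool delivery folder and move into it
    mkdir -p delivery/characterization/amrfinderplus
    cd delivery/characterization/amrfinderplus
    # symlink every AMRFinderPlus report; an unmatched glob simply leaves
    # one dangling link named after the literal pattern
    ln -s ../../../analysis/*amrfinderplus/*_out.tsv . 2>/dev/null
    # -xtype l matches only symlinks whose target does not resolve, so
    # valid links survive and dangling ones are deleted
    find .. -xtype l -delete
    cd ../../..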
From e63981b38f891d11a9b042bd4219d98e82bdbbfc Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Tue, 18 Jun 2024 14:13:30 +0200
Subject: [PATCH 071/321] Updated plasmidid lablog

---
 .../templates/plasmidid/ANALYSIS/ANALYSIS02_PLASMIDID/lablog | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/plasmidid/ANALYSIS/ANALYSIS02_PLASMIDID/lablog b/bu_isciii/templates/plasmidid/ANALYSIS/ANALYSIS02_PLASMIDID/lablog
index bc11143f8..b6d0b61ec 100644
--- a/bu_isciii/templates/plasmidid/ANALYSIS/ANALYSIS02_PLASMIDID/lablog
+++ b/bu_isciii/templates/plasmidid/ANALYSIS/ANALYSIS02_PLASMIDID/lablog
@@ -4,6 +4,6 @@ mkdir logs
 scratch_dir=$(echo $PWD | sed 's/\/data\/bi\/scratch_tmp/\/scratch/g')
 ln -s ../samples_id.txt .

-cat ../samples_id.txt | xargs -I @@ echo "srun --chdir $scratch_dir --output logs/PLASMIDID.@@.%j.log --job-name PLASMIDID_@@ --partition short_idx --time 05:00:00 env - PATH="$PATH" singularity exec --bind /data/bi/references/ --bind ${scratch_dir} --bind ${scratch_dir}/../../ /scratch/bi/singularity-images/depot.galaxyproject.org-singularity-plasmidid-1.6.5--hdfd78af_0.img plasmidID -1 ${scratch_dir}/../*ASSEMBLY/01-preprocessing/trimmed_sequences/@@_1.trim.fastq.gz -2 ${scratch_dir}/../*ASSEMBLY/01-preprocessing/trimmed_sequences/@@_2.trim.fastq.gz -d /data/bi/references/plasmidID/plasmid_ddbb/20200203/20200203_plasmids.fasta -s @@ -c ${scratch_dir}/../*ASSEMBLY/03-assembly/unicycler/@@.fasta -a ${scratch_dir}/plasmidID_annotation_config_file.txt --no-trim -o ${scratch_dir} &" > _01_plasmidID.sh
+cat ../samples_id.txt | xargs -I @@ echo "srun --chdir $scratch_dir --output logs/PLASMIDID.@@.%j.log --job-name PLASMIDID_@@ --partition short_idx --time 05:00:00 env - PATH="$PATH" singularity exec --bind /data/bi/references/ --bind ${scratch_dir} --bind ${scratch_dir}/../../ /data/bi/pipelines/singularity-images/depot.galaxyproject.org-singularity-plasmidid-1.6.5--hdfd78af_0.img plasmidID -1 ${scratch_dir}/../*ASSEMBLY/01-processing/fastp/@@_1.fastp.fastq.gz -2 ${scratch_dir}/../*ASSEMBLY/01-processing/fastp/@@_2.fastp.fastq.gz -d /data/bi/references/plasmidID/plasmid_ddbb/20200203/20200203_plasmids.fasta -s @@ -c ${scratch_dir}/../*ASSEMBLY/03-assembly/unicycler/@@.fasta -a ${scratch_dir}/plasmidID_annotation_config_file.txt --no-trim -o ${scratch_dir} &" > _01_plasmidID.sh

-echo "srun --chdir $scratch_dir --partition short_idx --time 1:00:00 --output logs/SUMMARY.%j.log /data/bi/pipelines/plasmidID/bin/summary_report_pid.py -i NO_GROUP -g &" > _02_summary_table.sh
+echo "srun --chdir $scratch_dir --partition short_idx --time 1:00:00 --output logs/SUMMARY.%j.log env - PATH="$PATH" singularity exec --bind /data/bi/references/ --bind ${scratch_dir} --bind ${scratch_dir}/../../ /data/bi/pipelines/singularity-images/depot.galaxyproject.org-singularity-plasmidid-1.6.5--hdfd78af_0.img summary_report_pid.py -i NO_GROUP -g &" > _02_summary_table.sh

From 84607b44d6b31249ccfcdfae4e18bc0a9beaf63c Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Tue, 18 Jun 2024 14:17:05 +0200
Subject: [PATCH 072/321] Modified pipelines paths where necessary

---
 .../IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog | 4 ++--
 .../templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog | 2 +-
 .../freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog | 2 +-
 .../ANALYSIS/ANALYSIS01_RBPANEL/07-annotation/lablog | 2 +-
 .../mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/02-kmerfinder/lablog | 2 +-
 .../templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog | 2 +-
 .../templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/lablog | 2 +-
 .../seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog | 2 +-
 bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 4 ++--
 bu_isciii/templates/viralrecon/DOC/viralrecon.config | 2 +-
 .../templates/viralrecon/DOC/viralrecon_sars_nanopore.config | 4 ++--
 .../viralrecon/DOC/viralrecon_sars_nanopore_params.yml | 4 ++--
 12 files changed, 16 insertions(+), 16 deletions(-)

diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog
index 01c499462..c694a5b91 100755
--- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog
+++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog
@@ -5,7 +5,7 @@ mkdir logs

 scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")

-cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --cpus-per-task 32 --mem 35000M --chdir $scratch_dir --time 01:00:00 --output logs/IRMA.${in}.%j.log /data/bi/pipelines/flu-amd-202402/IRMA FLU_AD ../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${in} --external-config ../../../DOC/irma_config.sh &"; done > _01_irma.sh
+cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --cpus-per-task 32 --mem 35000M --chdir $scratch_dir --time 01:00:00 --output logs/IRMA.${in}.%j.log /data/bi/pipelines/flu-amd/flu-amd-1.1.4/IRMA FLU_AD ../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${in} --external-config ../../../DOC/irma_config.sh &"; done > _01_irma.sh

 echo 'bash create_irma_stats.sh' > _02_create_stats.sh

@@ -32,4 +32,4 @@ echo 'grep -w 'C__' irma_stats.txt | cut -f1 | while read sample; do cat C_fragm
 echo 'cat ../samples_id.txt | while read in; do cat ${in}/*.fasta | sed "s/^>/\>${in}_/g" | sed 's/_H1//g' | sed 's/_H3//g' | sed 's/_N1//g' | sed 's/_N2//g' | sed 's@-@/@g' | sed 's/_A_/_/g' | sed 's/_B_/_/g' | sed 's/_C_/_/g' >> all_samples_completo.txt; done' >> _03_post_processing.sh
 echo 'sed "s/__//g" irma_stats.txt > clean_irma_stats.txt' >> _03_post_processing.sh
-echo 'sed "s/_\t/\t/g" irma_stats.txt > clean_irma_stats.txt' >> _03_post_processing.sh
\ No newline at end of file
+echo 'sed "s/_\t/\t/g" irma_stats.txt > clean_irma_stats.txt' >> _03_post_processing.sh
diff --git a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
index bd8f8549a..25e84ab36 100644
--- a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
+++ b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
@@ -107,7 +107,7 @@ cat <<EOF > assembly.sbatch
 # module load Nextflow/23.10.0 singularity
 export NXF_OPTS="-Xms500M -Xmx8G"

-nextflow run /data/bi/pipelines/nf-core-bacass/main.nf \\
+nextflow run /data/bi/pipelines/nf-core-bacass/nf-core-bacass-2.2.0dev/main.nf \\
     -c ../../DOC/hpc_slurm_assembly.config \\
     -profile singularity \\
     --input samplesheet.csv \\
diff --git a/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog b/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog
index 84c6c6dfa..77a8c99b7 100644
--- a/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog
+++ b/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog
@@ -17,7 +17,7 @@ cat <<EOF > mag.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /scratch/bi/pipelines/nf-core-mag-2.1.1/workflow/main.nf \\
+nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.1.1/workflow/main.nf \\
     -c ../../DOC/mag.config \\
     --input '00-reads/*_R{1,2}.fastq.gz' \\
     --outdir $(date '+%Y%m%d')_mag \\
diff --git a/bu_isciii/templates/lowfreq_panel/ANALYSIS/ANALYSIS01_RBPANEL/07-annotation/lablog b/bu_isciii/templates/lowfreq_panel/ANALYSIS/ANALYSIS01_RBPANEL/07-annotation/lablog
index 29a8a8cbd..584fe9b36 100644
--- a/bu_isciii/templates/lowfreq_panel/ANALYSIS/ANALYSIS01_RBPANEL/07-annotation/lablog
+++ b/bu_isciii/templates/lowfreq_panel/ANALYSIS/ANALYSIS01_RBPANEL/07-annotation/lablog
@@ -27,7 +27,7 @@ echo "sbatch bcftools_query.sbatch" > _01_bcftools_query.sh

 # module load Java/1.8.0_281 R/4.1.0-foss-2021a

-cat ../samples_id.txt | xargs -I @@ echo "mkdir @@;srun --chdir ${scratch_dir} --output logs/KGGSEQ.@@.%j.log --job-name KGGSEQ --cpus-per-task 1 --mem 8192 --partition short_idx --time 02:00:00 java -jar -Xmx8g /data/bi/pipelines/kggseqhg19/kggseq.jar --no-web --buildver hg19 --vcf-file ../06-VarScan/@@/@@.vcf.gz --db-gene refgene --db-score dbnsfp --genome-annot --db-filter ESP5400,dbsnp141,1kg201305 --rare-allele-freq 1 --mendel-causing-predict best --omim-annot --out @@/@@_annot.txt --no-qc &" > _02_kggseq.sh
+cat ../samples_id.txt | xargs -I @@ echo "mkdir @@;srun --chdir ${scratch_dir} --output logs/KGGSEQ.@@.%j.log --job-name KGGSEQ --cpus-per-task 1 --mem 8192 --partition short_idx --time 02:00:00 java -jar -Xmx8g /data/bi/pipelines/kggseq/kggseqhg19/kggseq.jar --no-web --buildver hg19 --vcf-file ../06-VarScan/@@/@@.vcf.gz --db-gene refgene --db-score dbnsfp --genome-annot --db-filter ESP5400,dbsnp141,1kg201305 --rare-allele-freq 1 --mendel-causing-predict best --omim-annot --out @@/@@_annot.txt --no-qc &" > _02_kggseq.sh
 cat ../samples_id.txt | xargs -I % echo "gunzip %/%_annot.txt.flt.txt.gz" > _03_final_table.sh
 cat ../samples_id.txt | xargs -I % echo 'cp header %/%_header.table && tail -n +2 %/%.table >> %/%_header.table' >> _03_final_table.sh
 cat ../samples_id.txt | xargs -I % echo "Rscript merge_parse.R %" >> _03_final_table.sh
diff --git a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/02-kmerfinder/lablog b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/02-kmerfinder/lablog
index ea7174d24..eff310bb1 100644
--- a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/02-kmerfinder/lablog
+++ b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/02-kmerfinder/lablog
@@ -4,7 +4,7 @@ scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")

 mkdir logs

-cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --chdir ${scratch_dir} --mem 50G --output logs/KMERFINDER.${in}.%j.log singularity run -B /scratch/bi/ -B /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria /scratch/bi/pipelines/kmerfinder_v3.0.simg -i ../01-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../01-preprocessing/${in}/${in}_R2_filtered.fastq.gz -o ${scratch_dir}/${in} -db /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria/bacteria.ATG -tax /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria/bacteria.name -x &";done > _01_kmerfinder.sh
+cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --chdir ${scratch_dir} --mem 50G --output logs/KMERFINDER.${in}.%j.log singularity run -B /scratch/bi/ -B /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria /data/bi/pipelines/singularity-images/kmerfinder_v3.0.simg -i ../01-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../01-preprocessing/${in}/${in}_R2_filtered.fastq.gz -o ${scratch_dir}/${in} -db /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria/bacteria.ATG -tax /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria/bacteria.name -x &";done > _01_kmerfinder.sh

 echo "cat ../samples_id.txt | xargs -I % awk '{FS=\"\t\"} NR==2 {print \$1}' %/results.txt | awk '{count[\$0]++} END{for (i in count) {print count[i], i}}' | sort -nr" > _02_find_common_reference.sh
diff --git a/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog b/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
index c91b4010f..ef1be3ced 100644
--- a/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
+++ b/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
@@ -20,7 +20,7 @@ cat <<EOF > pikavirus.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /scratch/bi/pipelines/PikaVirus/main.nf \\
+nextflow run /data/bi/pipelines/pikavirus/PikaVirus/main.nf \\
     -c ../../DOC/hpc_slurm_pikavirus.config \\
     --input samplesheet.csv \\
     --kraken_scouting false \\
diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/lablog b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/lablog
index d0674cda9..a39b66986 100644
--- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/lablog
+++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/lablog
@@ -19,7 +19,7 @@ cat <<EOF > rnaseq.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-/data/bi/pipelines/nf-core-rnaseq-3.10.1/workflow/main.nf \\
+/data/bi/pipelines/nf-core-rnaseq/nf-core-rnaseq-3.10.1/workflow/main.nf \\
     -c ../../DOC/hpc_slurm_rnaseq.config \\
     -params-file ../../DOC/hg38_ensmbl_rnaseq.yml \\
     --input samplesheet.csv \\
diff --git a/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog b/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog
index a960ff2e3..87cdb1f10 100644
--- a/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog
+++ b/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog
@@ -21,7 +21,7 @@ cat <<EOF > seek_destroy.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /scratch/bi/pipelines/Seek-Destroy/main.nf \\
+nextflow run /data/bi/pipelines/seek-destroy-nf/main.nf \\
     -c ../../DOC/seek_destroy.config \\
     --input samplesheet.csv \\
     --scout_database /data/bi/references/kraken/minikraken_8GB_20200312.tgz \\
diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index f63925f21..3a81fc18a 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -363,7 +363,7 @@ do
     echo "#SBATCH --output ${ref}_$(date '+%Y%m%d')_viralrecon.log" >> ${FOLDER_NAME}/lablog
     printf "#SBATCH --chdir \$scratch_dir\n\n" >> ${FOLDER_NAME}/lablog
     printf 'export NXF_OPTS="-Xms500M -Xmx4G"\n\n' >> ${FOLDER_NAME}/lablog
-    echo "nextflow run /data/bi/pipelines/nf-core-viralrecon-2.6.0/workflow/main.nf \\\\" >> ${FOLDER_NAME}/lablog
+    echo "nextflow run /data/bi/pipelines/nf-core-viralrecon/nf-core-viralrecon-2.6.0/workflow/main.nf \\\\" >> ${FOLDER_NAME}/lablog
     echo " -c ../${CONFIG_FILE} \\\\" >> ${FOLDER_NAME}/lablog
     echo " -params-file ../${PARAMS_FILE} \\\\" >> ${FOLDER_NAME}/lablog
     echo " --input samplesheet_${ref}.csv \\\\" >> ${FOLDER_NAME}/lablog
@@ -403,4 +403,4 @@ rm percentajeNs.py
 rm _02_create_run_percentage_Ns.sh
 cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd ..

-echo_green "\nLablog_viralrecon execution has been completed successfully!"
\ No newline at end of file
+echo_green "\nLablog_viralrecon execution has been completed successfully!"
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon.config b/bu_isciii/templates/viralrecon/DOC/viralrecon.config
index 564f23d33..ea6317c97 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon.config
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon.config
@@ -1,7 +1,7 @@
 singularity {
     enabled = true
     autoMounts = true
-    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/ -B "$HOME"'
+    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019/ -B "$HOME"'
 }

 process {
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
index 31ca69413..c844e28dd 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
@@ -1,7 +1,7 @@
 singularity {
     enabled = true
     autoMounts = true
-    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/'
+    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019/'
 }

 process {
@@ -10,7 +10,7 @@ process {
     withName: 'ARTIC_MINION' {
         ext.args = [
             '--normalise 500',
-            '--scheme-directory /data/bi/pipelines/artic-ncov2019/primer_schemes/',
+            '--scheme-directory /data/bi/pipelines/artic-ncov2019/artic-ncov2019/primer_schemes/',
             '--medaka'
         ].join(' ').trim()
     }
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
index 2ef67955d..c342c8e4e 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
@@ -2,8 +2,8 @@ platform: 'nanopore'
 protocol: 'amplicon'
 artic_scheme: 'nCoV-2019'
 primer_set_version: 5
-fasta: '/data/bi/pipelines/artic-ncov2019/primer_schemes/nCoV-2019/V5/ESIB-EQA.reference.fasta'
-primer_bed: '/data/bi/pipelines/artic-ncov2019/primer_schemes/nCoV-2019/V5/ESIB-EQA.primer.bed'
+fasta: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019/primer_schemes/nCoV-2019/V5/ESIB-EQA.reference.fasta'
+primer_bed: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019/primer_schemes/nCoV-2019/V5/ESIB-EQA.primer.bed'
 primer_fasta: '../../RAW/ESIB_EQA_2023.SARS1/ESIB_EQA_2023.SARS1.primers.fasta'
 kraken2_db: '/data/bi/references/eukaria/homo_sapiens/hg38/UCSC/kraken2/kraken2_human.tar.gz'
 nextclade_dataset_name: 'sars-cov-2'

From 40b82c3adcc7e03e44d40fbd979621e3e62673ff Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Tue, 18 Jun 2024 14:35:55 +0200
Subject: [PATCH 073/321] Updated CHANGELOG.md

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5aae27a46..abaf2f21a 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -50,6 +50,7 @@ Code contributions to the new version:
 - Included multiqc_report.html in RESULTS folder in every service, where necessary [#265](https://github.com/BU-ISCIII/buisciii-tools/pull/265)
 - Added MAG template and removed MAG from other templates [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288)
 - Added amrfinderplus to characterization template. [#289](https://github.com/BU-ISCIII/buisciii-tools/pull/289)
+- Updated all files so that paths referring to /pipelines/ are updated according to the new structure [#287](https://github.com/BU-ISCIII/buisciii-tools/pull/287)

 ### Modules

From 0211853aff1c25bad81a279ae821dec0cd3c03c6 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Tue, 18 Jun 2024 15:55:58 +0200
Subject: [PATCH 074/321] Modified some auxiliary viralrecon files

---
 bu_isciii/templates/viralrecon/DOC/viralrecon.config | 2 +-
 .../templates/viralrecon/DOC/viralrecon_sars_nanopore.config | 4 ++--
 .../viralrecon/DOC/viralrecon_sars_nanopore_params.yml | 4 ++--
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon.config b/bu_isciii/templates/viralrecon/DOC/viralrecon.config
index ea6317c97..bc862c2e5 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon.config
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon.config
@@ -1,7 +1,7 @@
 singularity {
     enabled = true
     autoMounts = true
-    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019/ -B "$HOME"'
+    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/ -B "$HOME"'
 }

 process {
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
index c844e28dd..03ef609e4 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
@@ -1,7 +1,7 @@
 singularity {
     enabled = true
     autoMounts = true
-    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019/'
+    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/'
 }

 process {
@@ -10,7 +10,7 @@ process {
     withName: 'ARTIC_MINION' {
         ext.args = [
             '--normalise 500',
-            '--scheme-directory /data/bi/pipelines/artic-ncov2019/artic-ncov2019/primer_schemes/',
+            '--scheme-directory /data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/primer_schemes/',
             '--medaka'
         ].join(' ').trim()
     }
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
index c342c8e4e..56c95cbf4 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
@@ -2,8 +2,8 @@ platform: 'nanopore'
 protocol: 'amplicon'
 artic_scheme: 'nCoV-2019'
 primer_set_version: 5
-fasta: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019/primer_schemes/nCoV-2019/V5/ESIB-EQA.reference.fasta'
-primer_bed: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019/primer_schemes/nCoV-2019/V5/ESIB-EQA.primer.bed'
+fasta: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/primer_schemes/nCoV-2019/V5/ESIB-EQA.reference.fasta'
+primer_bed: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/primer_schemes/nCoV-2019/V5/ESIB-EQA.primer.bed'
 primer_fasta: '../../RAW/ESIB_EQA_2023.SARS1/ESIB_EQA_2023.SARS1.primers.fasta'
 kraken2_db: '/data/bi/references/eukaria/homo_sapiens/hg38/UCSC/kraken2/kraken2_human.tar.gz'
 nextclade_dataset_name: 'sars-cov-2'

From 8ab181283966c64a1c936e8c9dcf079e5e8cc65d Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 27 Jun 2024 13:26:29 +0200
Subject: [PATCH 075/321] Fixed some paths in a few templates and auxiliary files

---
 bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog | 2 +-
 .../templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog | 2 +-
 .../seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog | 2 +-
 bu_isciii/templates/viralrecon/DOC/viralrecon.config | 2 +-
 .../templates/viralrecon/DOC/viralrecon_sars_nanopore.config | 4 ++--
 .../viralrecon/DOC/viralrecon_sars_nanopore_params.yml | 4 ++--
 6 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog
index 39408a717..d68708d31 100644
--- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog
+++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog
@@ -18,7 +18,7 @@ cat <<EOF > mag.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.1.1/workflow/main.nf \\
+nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\
     -c ../../DOC/mag.config \\
     --input '00-reads/*_R{1,2}.fastq.gz' \\
     --outdir $(date '+%Y%m%d')_mag \\
diff --git a/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog b/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
index ef1be3ced..83da38684 100644
--- a/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
+++ b/bu_isciii/templates/pikavirus/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
@@ -20,7 +20,7 @@ cat <<EOF > pikavirus.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /data/bi/pipelines/pikavirus/PikaVirus/main.nf \\
+nextflow run /data/bi/pipelines/pikavirus/pikavirus-1.0dev/main.nf \\
     -c ../../DOC/hpc_slurm_pikavirus.config \\
     --input samplesheet.csv \\
     --kraken_scouting false \\
diff --git a/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog b/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog
index 87cdb1f10..381cbe632 100644
--- a/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog
+++ b/bu_isciii/templates/seek_and_destroy/ANALYSIS/ANALYSIS01_SEEK_DESTROY/lablog
@@ -21,7 +21,7 @@ cat <<EOF > seek_destroy.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /data/bi/pipelines/seek-destroy-nf/main.nf \\
+nextflow run /data/bi/pipelines/seek-destroy-nf/seek-destroy-nf-1.0dev/main.nf \\
     -c ../../DOC/seek_destroy.config \\
     --input samplesheet.csv \\
     --scout_database /data/bi/references/kraken/minikraken_8GB_20200312.tgz \\
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon.config b/bu_isciii/templates/viralrecon/DOC/viralrecon.config
index bc862c2e5..4b5f4e2a5 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon.config
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon.config
@@ -1,7 +1,7 @@
 singularity {
     enabled = true
     autoMounts = true
-    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/ -B "$HOME"'
+    runOptions = '-B /data/bi/references/ -B "$HOME"'
 }

 process {
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
index 03ef609e4..865d1a0d2 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore.config
@@ -1,7 +1,7 @@
 singularity {
     enabled = true
     autoMounts = true
-    runOptions = '-B /data/bi/references/ -B /data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/'
+    runOptions = '-B /data/bi/references/'
 }

 process {
@@ -10,7 +10,7 @@ process {
     withName: 'ARTIC_MINION' {
         ext.args = [
             '--normalise 500',
-            '--scheme-directory /data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/primer_schemes/',
+            '--scheme-directory /data/bi/references/virus/2019-nCoV/primer_schemes/',
             '--medaka'
         ].join(' ').trim()
     }
diff --git a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
index 56c95cbf4..7134065a0 100644
--- a/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
+++ b/bu_isciii/templates/viralrecon/DOC/viralrecon_sars_nanopore_params.yml
@@ -2,8 +2,8 @@ platform: 'nanopore'
 protocol: 'amplicon'
 artic_scheme: 'nCoV-2019'
 primer_set_version: 5
-fasta: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/primer_schemes/nCoV-2019/V5/ESIB-EQA.reference.fasta'
-primer_bed: '/data/bi/pipelines/artic-ncov2019/artic-ncov2019_v0/primer_schemes/nCoV-2019/V5/ESIB-EQA.primer.bed'
+fasta: '/data/bi/references/virus/2019-nCoV/primer_schemes/nCoV-2019/V5/ESIB-EQA.reference.fasta'
+primer_bed: '/data/bi/references/virus/2019-nCoV/primer_schemes/nCoV-2019/V5/ESIB-EQA.primer.bed'
 primer_fasta: '../../RAW/ESIB_EQA_2023.SARS1/ESIB_EQA_2023.SARS1.primers.fasta'
 kraken2_db: '/data/bi/references/eukaria/homo_sapiens/hg38/UCSC/kraken2/kraken2_human.tar.gz'
 nextclade_dataset_name: 'sars-cov-2'

From 0cbb21d76ae7aac6b58a37678d2247f304038e94 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 27 Jun 2024 13:35:57 +0200
Subject: [PATCH 076/321] Updated mag template

---
 .../templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog b/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog
index 77a8c99b7..0086364db 100644
--- a/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog
+++ b/bu_isciii/templates/freebayes_outbreak/ANALYSIS/ANALYSIS02_MET/lablog
@@ -17,7 +17,7 @@ cat <<EOF > mag.sbatch

 export NXF_OPTS="-Xms500M -Xmx4G"

-nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.1.1/workflow/main.nf \\
+nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\
     -c ../../DOC/mag.config \\
     --input '00-reads/*_R{1,2}.fastq.gz' \\
     --outdir $(date '+%Y%m%d')_mag \\

From 841bedd88e3b45ab58bf4dee8ad9f3df66dbb765 Mon Sep 17 00:00:00 2001
From: "github-actions[bot]" <41898282+github-actions[bot]@users.noreply.github.com>
Date: Thu, 1 Feb 2024 13:58:18 +0100
Subject: [PATCH 077/321] Merge changes from main into hotfix (#195)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: Sara Monzón

From 18a1fe758a3868ff113f57206806db534aa18e1c Mon Sep 17 00:00:00 2001
From: svarona
Date: Mon, 1 Jul 2024 10:59:24 +0200
Subject: [PATCH 078/321] Fixed error because items can be None, an empty list, or a list with content

---
 bu_isciii/clean.py | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/clean.py b/bu_isciii/clean.py
index cc514628a..f1f14fc67 100644
--- a/bu_isciii/clean.py
+++ b/bu_isciii/clean.py
@@ -129,16 +129,16 @@ def get_clean_items(self, services_ids, type="files"):
         for service in services_ids:
             try:
                 items = service_conf.get_find_deep(service, type)
-                if items:
-                    for item in items:
-                        if item not in clean_items_list:
-                            clean_items_list.append(item)
-                else:
+                if items is None:
                     stderr.print(
                         "[red]ERROR: Service type %s not found in services json file for service %s."
                         % (type, service)
                     )
                     sys.exit()
+                else:
+                    for item in items:
+                        if item not in clean_items_list:
+                            clean_items_list.append(item)
             except KeyError as e:
                 stderr.print(
                     "[red]ERROR: Service id %s not found in services json file."

From fdcc10cf8739f9d9a673936eaac790b444ba55fe Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 09:18:01 +0200
Subject: [PATCH 079/321] Updated assembly's lablog and config files

---
 .../assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog | 16 +++++++---------
 .../assembly/DOC/hpc_slurm_assembly.config | 16 ++++++++++++++++
 2 files changed, 23 insertions(+), 9 deletions(-)

diff --git a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
index 25e84ab36..6124ca630 100644
--- a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
+++ b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
@@ -107,25 +107,23 @@ cat <<EOF > assembly.sbatch
 # module load Nextflow/23.10.0 singularity
 export NXF_OPTS="-Xms500M -Xmx8G"

-nextflow run /data/bi/pipelines/nf-core-bacass/nf-core-bacass-2.2.0dev/main.nf \\
+nextflow run /data/bi/pipelines/nf-core-bacass/nf-core-bacass-2.3.1/main.nf \\
     -c ../../DOC/hpc_slurm_assembly.config \\
     -profile singularity \\
     --input samplesheet.csv \\
     --outdir ./ \\
-    --assembly_type ${ASSEMBLY_MODE} \\
-    --assembler ${ASSEMBLER} \\
+    --assembly_type short \\
+    --assembler unicycler \\
     --skip_polish true \\
-    --save_trimmed ${SAVETRIMMED} \\
+    --save_trimmed false \\
     --fastp_args '--qualified_quality_phred 20 --cut_mean_quality 20' \\
     --skip_kraken2 true \\
     --skip_kmerfinder false \\
-    --kmerfinderdb /data/bi/references/kmerfinder/20190108_stable_dirs/bacteria \\
-    --ncbi_assembly_metadata /data/bi/references/bacteria/20191212/assembly_summary_bacteria.txt \\
-    ${PROKKA_ARGS} \\
+    --kmerfinderdb /data/bi/references/kmerfinder/20241004/bacteria \\
+    --ncbi_assembly_metadata /data/bi/references/bacteria/20240626/assembly_summary_refseq.txt \\
+    --prokka_args '--gram +' \\
     -resume
 EOF

 echo "sbatch assembly.sbatch" > _01_nf_assembly.sh
-
-
diff --git a/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config b/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config
index 04dddf4db..480d57f4a 100644
--- a/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config
+++ b/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config
@@ -228,4 +228,20 @@ process {
         ]
     ]
 }
+    withName: '.*:.*:FASTQ_TRIM_FASTP_FASTQC:FASTQC_RAW' {
+        maxRetries = 2
+        memory = {12.GB * task.attempt}
+    }
+    withName:KMERFINDER{
+        maxRetries = 2
+        memory = {12.GB * task.attempt}
+    }
+    withName: '.*:.*:FASTQ_TRIM_FASTP_FASTQC:FASTQC_TRIM' {
+        maxRetries = 2
+        memory = {12.GB * task.attempt}
+    }
+    withName: '.*:.*:UNICYCLER' {
+        maxRetries = 2
+        memory = {32.GB * task.attempt}
+    }
 }

From c3ec911c95de03135518eb1bbe1e470942425ba3 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 09:24:33 +0200
Subject: [PATCH 080/321] Fixed minor mistakes in the lablog file

---
 .../assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
index 6124ca630..a196cc46d 100644
--- a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
+++ b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
@@ -112,16 +112,16 @@ nextflow run /data/bi/pipelines/nf-core-bacass/nf-core-bacass-2.3.1/main.nf \\
     -profile singularity \\
     --input samplesheet.csv \\
     --outdir ./ \\
-    --assembly_type short \\
-    --assembler unicycler \\
+    --assembly_type ${ASSEMBLY_MODE} \\
+    --assembler ${ASSEMBLER} \\
     --skip_polish true \\
-    --save_trimmed false \\
+    --save_trimmed ${SAVETRIMMED} \\
     --fastp_args '--qualified_quality_phred 20 --cut_mean_quality 20' \\
     --skip_kraken2 true \\
     --skip_kmerfinder false \\
     --kmerfinderdb /data/bi/references/kmerfinder/20241004/bacteria \\
     --ncbi_assembly_metadata /data/bi/references/bacteria/20240626/assembly_summary_refseq.txt \\
-    --prokka_args '--gram +' \\
+    ${PROKKA_ARGS} \\
     -resume
 EOF

From aa9296574256fdfa2acd703b3deb0f930426881c Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 09:27:21 +0200
Subject: [PATCH 081/321] Updated CHANGELOG.md

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index abaf2f21a..253b5add6 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -51,6 +51,7 @@ Code contributions to the new version:
 - Added MAG template and removed MAG from other templates [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288)
 - Added amrfinderplus to characterization template. [#289](https://github.com/BU-ISCIII/buisciii-tools/pull/289)
 - Updated all files so that paths referring to /pipelines/ are updated according to the new structure [#287](https://github.com/BU-ISCIII/buisciii-tools/pull/287)
+- Updated assembly's template (lablog and config files) [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295)

 ### Modules

From 9242e86019d3f7d523e9cfaa48e5ada231d32d5b Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 11:05:58 +0200
Subject: [PATCH 082/321] Updated ariba's lablog

---
 .../ANALYSIS/ANALYSIS01_CHARACTERIZATION/02-ariba/run/lablog | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/02-ariba/run/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/02-ariba/run/lablog
index 9ddf07267..1bfc20c02 100644
--- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/02-ariba/run/lablog
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/02-ariba/run/lablog
@@ -9,8 +9,8 @@ join -j 2 ../../samples_id.txt ../databases.txt | sed 's/^ //g' > sample_databas
 # col 1 (arr[0]): sample
 # col 2 (arr[1]): database

-cat sample_database.txt | grep -v 'pubmlst' | while read in; do arr=($in); echo "mkdir -p ${arr[0]}; srun --chdir $scratch_dir --output logs/ARIBA_${arr[0]}_${arr[1]}.%j.log --job-name ARIBA_${arr[0]}_${arr[1]} --cpus-per-task 5 --mem 5G --partition short_idx --time 02:00:00 singularity exec -B ${scratch_dir}/../../../../ -B /data/bi/references/ariba/20211216/${arr[1]}/ /data/bi/pipelines/singularity-images/ariba:2.14.6--py36h4aaaa08_3 ariba run /data/bi/references/ariba/20211216/${arr[1]}/out.${arr[1]}.prepareref ${scratch_dir}/../../01-preprocessing/${arr[0]}/${arr[0]}_R1_filtered.fastq.gz ${scratch_dir}/../../01-preprocessing/${arr[0]}/${arr[0]}_R2_filtered.fastq.gz ${scratch_dir}/${arr[0]}/out_${arr[1]}_${arr[0]}_run &"; done > _01_ariba.sh
+cat sample_database.txt | grep -v 'pubmlst' | while read in; do arr=($in); echo "mkdir -p ${arr[0]}; srun --chdir $scratch_dir --output logs/ARIBA_${arr[0]}_${arr[1]}.%j.log --job-name ARIBA_${arr[0]}_${arr[1]} --cpus-per-task 5 --mem 5G --partition short_idx --time 02:00:00 singularity exec -B ${scratch_dir}/../../../../ -B /data/bi/references/ariba/ /data/bi/pipelines/singularity-images/ariba:2.14.6--py39heaaa4ec_6 ariba run /data/bi/references/ariba/latest/${arr[1]}/out.${arr[1]}.prepareref ${scratch_dir}/../../01-preprocessing/${arr[0]}/${arr[0]}_R1_filtered.fastq.gz ${scratch_dir}/../../01-preprocessing/${arr[0]}/${arr[0]}_R2_filtered.fastq.gz ${scratch_dir}/${arr[0]}/out_${arr[1]}_${arr[0]}_run &"; done > _01_ariba.sh

-cat ../../../samples_id.txt | while read in; do echo "mkdir -p $in; srun --chdir $scratch_dir --output logs/ARIBA_${in}_pubmlst.%j.log --job-name ARIBA_${in}_pubmlst --cpus-per-task 5 --mem 5G --partition short_idx --time 02:00:00 singularity exec -B ${scratch_dir}/../../../../ /data/bi/pipelines/singularity-images/ariba:2.14.6--py36h4aaaa08_3 ariba run ${scratch_dir}/${downloaded_ref} ${scratch_dir}/../../01-preprocessing/${in}/${in}_R1_filtered.fastq.gz ${scratch_dir}/../../01-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${scratch_dir}/${in}/out_pubmlst_${in}_run &"; done > _01_ariba.sh
+cat ../../../samples_id.txt | while read in; do echo "mkdir -p $in; srun --chdir $scratch_dir --output logs/ARIBA_${in}_pubmlst.%j.log --job-name ARIBA_${in}_pubmlst --cpus-per-task 5 --mem 5G --partition short_idx --time 02:00:00 singularity exec -B ${scratch_dir}/../../../../ /data/bi/pipelines/singularity-images/ariba:2.14.6--py39heaaa4ec_6 ariba run ${scratch_dir}/${downloaded_ref} ${scratch_dir}/../../01-preprocessing/${in}/${in}_R1_filtered.fastq.gz ${scratch_dir}/../../01-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${scratch_dir}/${in}/out_pubmlst_${in}_run &"; done >> _01_ariba.sh

 cat sample_database.txt | while read in; do arr=($in); echo "mv ${arr[0]}/out_${arr[1]}_${arr[0]}_run/report.tsv ${arr[0]}/out_${arr[1]}_${arr[0]}_run/${arr[0]}_${arr[1]}_report.tsv"; done > _02_fix_tsvreport.sh

From ac13addae41444c75ea132bb75284520118c7a71 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 11:39:57 +0200
Subject: [PATCH 083/321] Fixed minor mistakes in the config file

---
 .../assembly/DOC/hpc_slurm_assembly.config | 27 +++++++------------
 1 file changed, 10 insertions(+), 17 deletions(-)

diff --git a/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config b/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config
index 480d57f4a..284208fbb 100644
--- a/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config
+++ b/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config
@@ -38,6 +38,8 @@ params { publish_dir_mode = 'copy' }

 process {
     withName: '.*:.*:FASTQ_TRIM_FASTP_FASTQC:FASTQC_RAW' {
+        maxRetries = 2
+        memory = {12.GB * task.attempt}
         publishDir = [
             [
                 path: { "${params.outdir}/01-processing/fastqc/raw" },
@@ -71,6 +73,8 @@ process {
         ]
     }
     withName: '.*:.*:FASTQ_TRIM_FASTP_FASTQC:FASTQC_TRIM' {
+        maxRetries = 2
+        memory = {12.GB * task.attempt}
         publishDir = [
             [
                 path: { "${params.outdir}/01-processing/fastqc/trim" },
@@ -127,6 +131,9 @@ process {
         ]
     }
     withName: '.*:.*:KMERFINDER_SUBWORKFLOW:KMERFINDER' {
+        maxRetries = 2
+        memory = {12.GB * task.attempt}
+        errorStrategy = { task.exitStatus in [1] ? 'retry' : 'finish'}
         publishDir = [
             path: { "${params.outdir}/02-taxonomy_contamination/kmerfinder/${meta.id}" },
             mode: params.publish_dir_mode
@@ -145,7 +152,9 @@ process {
         ]
     }
     withName: 'UNICYCLER|CANU|MINIASM|DRAGONFLYE' {
-        publishDir = [
+        maxRetries = 2
+        memory = {64.GB * task.attempt}
+        publishDir = [
             path: { "${params.outdir}/03-assembly/${params.assembler}" },
             mode: params.publish_dir_mode,
             saveAs: { filename ->
@@ -228,20 +237,4 @@ process {
         ]
     ]
 }
-    withName: '.*:.*:FASTQ_TRIM_FASTP_FASTQC:FASTQC_RAW' {
-        maxRetries = 2
-        memory = {12.GB * task.attempt}
-    }
-    withName:KMERFINDER{
-        maxRetries = 2
-        memory = {12.GB * task.attempt}
-    }
-    withName: '.*:.*:FASTQ_TRIM_FASTP_FASTQC:FASTQC_TRIM' {
-        maxRetries = 2
-        memory = {12.GB * task.attempt}
-    }
-    withName: '.*:.*:UNICYCLER' {
-        maxRetries = 2
-        memory = {32.GB * task.attempt}
-    }
 }

From e0d1c30ddbf6db2ecedf48875a30ac497d25dca8 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 11:41:01 +0200
Subject: [PATCH 084/321] Replaced kmerfinder database with the latest one

---
 .../templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
index a196cc46d..38f5edd7a 100644
--- a/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
+++ b/bu_isciii/templates/assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
@@ -119,7 +119,7 @@ nextflow run /data/bi/pipelines/nf-core-bacass/nf-core-bacass-2.3.1/main.nf \\
     --fastp_args '--qualified_quality_phred 20 --cut_mean_quality 20' \\
     --skip_kraken2 true \\
     --skip_kmerfinder false \\
-    --kmerfinderdb /data/bi/references/kmerfinder/20241004/bacteria \\
+    --kmerfinderdb /data/bi/references/kmerfinder/latest/bacteria \\
     --ncbi_assembly_metadata /data/bi/references/bacteria/20240626/assembly_summary_refseq.txt \\
     ${PROKKA_ARGS} \\
     -resume

From a0d054a3e26500523a8be4eacd00d9cbea50db31 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 11:43:43 +0200
Subject: [PATCH 085/321] Updated amrfinderplus lablog

---
 .../ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog | 8 +++++---
 1 file changed, 5 insertions(+), 3 deletions(-)

diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
index a75150202..a8694b065 100644
--- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
+++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/03-amrfinderplus/lablog
@@ -4,6 +4,8 @@ scratch_dir=$(echo $(pwd) | sed 's@/data/bi/scratch_tmp/@/scratch/@g')

+mkdir logs
+
 possible_organisms=("Acinetobacter_baumannii" "Burkholderia_cepacia" "Burkholderia_pseudomallei" "Campylobacter" "Citrobacter_freundii" "Clostridioides_difficile" "Enterobacter_asburiae" "Enterobacter_cloacae" "Enterococcus_faecalis" "Enterococcus_faecium" "Escherichia" "Klebsiella_oxytoca" "Klebsiella_pneumoniae" "Neisseria_gonorrhoeae" "Neisseria_meningitidis" "Pseudomonas_aeruginosa" "Salmonella" "Serratia_marcescens" "Staphylococcus_aureus" "Staphylococcus_pseudintermedius" "Streptococcus_agalactiae" "Streptococcus_pneumoniae" "Streptococcus_pyogenes" "Vibrio_cholerae" "Vibrio_parahaemolyticus" "Vibrio_vulnificus" "OTHER")
 echo
 echo -e "\n\033[1;37mPlease select your bacteria from the following list:\033[0m"
 PS3=$(echo -e "\n\033[1;37mSelect number:\033[0m ")
@@ -12,12 +12,12 @@ select bacteria in "${possible_organisms[@]}"; do
     if [[ -n "$bacteria" ]]; then
         echo -e "\033[0;32mOrganism selected: ${bacteria}\033[0m"
         if [ $bacteria = "OTHER" ]; then
-            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --name ${in} --plus -o ${in}_out.tsv &" >> _01_run_amrfinder.sh; done
+            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx --output logs/AMRFINDER_${in}.%j.log --job-name AMRFINDER_${in} amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --name ${in} --plus -o ${in}_out.tsv &" >> _01_run_amrfinder.sh; done
         else
-            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism ${bacteria} --name ${in} --plus -o ${in}_out.tsv &" >> _01_run_amrfinder.sh; done
+            cat ../samples_id.txt | while read in; do echo "srun --chdir $scratch_dir --partition middle_idx --output logs/AMRFINDER_${in}.%j.log --job-name AMRFINDER_${in} amrfinder -n $(ls ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/${in}.fasta.gz) --organism ${bacteria} --name ${in} --plus -o ${in}_out.tsv &" >> _01_run_amrfinder.sh; done
         fi
         break
     else
         echo -e "\n\033[0;31mInvalid input.\033[0m"
     fi
-done
\ No newline at end of file
+done

From 10141026c71dc13ebf605b66ad47f5d51ede3711 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 12:42:21 +0200
Subject: [PATCH 086/321] Updated snippy lablog

---
 .../snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog
index 95826e287..c67c2a06d 100644
--- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog
+++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog
@@ -1,4 +1,4 @@
-rm # module load singularity
+# conda activate snippy

 scratch_dir=$(echo $PWD | sed 's/\/data\/bi\/scratch_tmp/\/scratch/g')

@@ -6,10 +6,10 @@ mkdir logs

 cat ../samples_id.txt | while read in; do echo -e "${in}\t${scratch_dir}/../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz\t${scratch_dir}/../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz"; done >> input.tab

-ls ${scratch_dir}/../../../REFERENCES | xargs -I %% singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_2 snippy-multi ${scratch_dir}/input.tab --mincov 9 --mapqual 10 --basequal 5 --minqual 30 --ref ${scratch_dir}/../../../REFERENCES/%% --cpus 5 > commands.out
+singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 snippy-multi ${scratch_dir}/input.tab --mincov 9 --mapqual 10 --basequal 5 --minqual 30 --ref ${scratch_dir}/../../../REFERENCES/GCF_015326295.1/GCF_015326295.1_ASM1532629v1_genomic.fna --cpus 5 > commands.out

-head -n -1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/SNIPPY.%j.log --job-name SNIPPY --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 @" | awk '{print $0" &"}' > _00_snippy.sh
-tail -n 1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/SNIPPY_CORE.%j.log --job-name SNIPPY --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 @" | awk '{print $0" &"}' > _01_snippy_core.sh
+head -n -1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/SNIPPY.%j.log --job-name SNIPPY --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 @" | awk '{print $0" &"}' > _00_snippy.sh
+tail -n 1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/SNIPPY_CORE.%j.log --job-name SNIPPY --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 @" | awk '{print $0" &"}' > _01_snippy_core.sh

@@ -19,7 +19,7 @@ tail -n 1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/S
 # echo "grep \"complex\" ./*/snps.vcf | cut -f 1,2,4,5 | cut -d \":\" -f 2 | sort -u | awk '{pos1=\$2; len_ref=length(\$3); printf \"%s\t%s\t%s\n\", \$1, pos1-1, pos1+len_ref+1}' | grep -v \"^#\" > mask_complex_variants.bed" > _01_snippy_core.sh
 # ls ${scratch_dir}/../../../REFERENCES | xargs -I %% echo "snippy-core --debug --mask ./mask_complex_variants.bed --mask-char 'N' --ref '../../../REFERENCES/%%' $(cat ../samples_id.txt | xargs)" >> _01_snippy_core.sh

-echo "snp-sites -b -c -o phylo.aln core.full.aln" > _02_phylo_aln.sh
+echo "srun --chdir ${scratch_dir} --output logs/SNIP-SITES.%j.log --job-name SNIP-SITES --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 snp-sites -b -c -o phylo.aln core.full.aln &" > _02_phylo_aln.sh

 # awk 'BEGIN{FS="[> ]"} /^>/{val=$2;next} {print val,length($0)}' phylo.aln

From 338997b011560611446ea965899d3e8de5441655 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 12:49:17 +0200
Subject: [PATCH 087/321] Updated services.json

---
 bu_isciii/templates/services.json | 17 -----------------
 1 file changed, 17 deletions(-)

diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json
index 7463cd5c4..3107c913f 100755
--- a/bu_isciii/templates/services.json
+++ b/bu_isciii/templates/services.json
@@ -16,23 +16,6 @@
         "delivery_md": "assets/reports/md/assembly.md",
         "results_md": "assets/reports/results/assembly.md"
     },
-    "mtbseq_assembly": {
-        "label": "",
-        "template": "mtbseq",
-        "order": 1,
-        "begin": "base",
-        "end": "mag_met",
-        "url": "https://github.com/ngs-fzb/MTBseq_source",
-        "description": "Mycobacterium tuberculosis mapping, variant calling and detection of resistance using MTBseq",
-        "clean": {
-            "folders":["Bam", "Mpileup"],
-            "files":["01-processing/fastp/sample_name_1.fastp.fastq.gz", "01-processing/fastp/sample_name_2.fastp.fastq.gz"]
-        },
-        "no_copy": ["RAW", "TMP"],
-        "last_folder":"REFERENCES",
-        "delivery_md": "",
-        "results_md": ""
-    },
     "mtbseq": {
         "label": "",
         "template": "mtbseq",

From 8abcc989a32427e7248e6ac1fc7ce9aedda62687 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Thu, 4 Jul 2024 12:50:06 +0200
Subject: [PATCH 088/321] Removed genomeev and mtbseq_assembly templates

---
 .../ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog | 38 -----
 .../ANALYSIS/ANALYSIS03_MAG/99-stats/lablog | 25 ----
 .../99-stats/multiqc_config.yaml | 13 --
 .../genomeev/ANALYSIS/ANALYSIS03_MAG/lablog | 30 ----
 .../genomeev/ANALYSIS/ANALYSIS04_BLAST/lablog | 75 ----------
 bu_isciii/templates/genomeev/ANALYSIS/README | 25 ----
 .../ANALYSIS/_02_create_run_percentage_Ns.sh | 1 -
 .../genomeev/ANALYSIS/create_assembly_stats.R | 130 ------------------
 .../ANALYSIS/create_summary_report.sh | 51 -------
 .../ANALYSIS/deduplicate_long_table.sh | 6 -
 .../genomeev/ANALYSIS/lablog_pikavirus | 4 -
 .../genomeev/ANALYSIS/lablog_viralrecon | 68 ---------
 .../genomeev/ANALYSIS/percentajeNs.py | 21 ---
 .../genomeev/ANALYSIS/samples_ref.txt | 4 -
 .../genomeev/DOC/hpc_slurm_pikavirus.config | 32 -----
 bu_isciii/templates/genomeev/DOC/mag.config | 19 ---
 .../DOC/viralrecon_metagenomic.config | 19 ---
 ...con_metagenomic_ignore_merge_codons.config | 42 ------
 .../DOC/viralrecon_metagenomic_params.yml | 11 --
 .../viralrecon_metagenomic_save_nohost.config | 40 ------
 bu_isciii/templates/genomeev/RAW/README | 1 -
 .../genomeev/RESULTS/lablog_genomeev_results | 17 ---
 bu_isciii/templates/genomeev/TMP/README | 1 -
 .../ANALYSIS/ANALYSIS01_ASSEMBLY/lablog | 37 -----
 .../ANALYSIS/ANALYSIS02_MTBSEQ/lablog | 21 ---
 .../ANALYSIS02_MTBSEQ/samples_all/lablog | 22 ---
 .../templates/mtbseq_assembly/ANALYSIS/lablog | 6 -
 .../templates/mtbseq_assembly/DOC/README | 1 -
 .../DOC/hpc_slurm_assembly.config | 27 ----
 .../templates/mtbseq_assembly/RAW/README | 1 -
 .../mtbseq_assembly/REFERENCES/README | 1 -
 .../templates/mtbseq_assembly/RESULTS/README | 1 -
 .../RESULTS/lablog_mtbseq_assembly_results | 9 --
 .../templates/mtbseq_assembly/TMP/README | 1 -
 34 files changed, 800 deletions(-)
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/lablog
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/multiqc_config.yaml
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/lablog
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS04_BLAST/lablog
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/README
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/_02_create_run_percentage_Ns.sh
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/create_assembly_stats.R
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/create_summary_report.sh
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/deduplicate_long_table.sh
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/lablog_pikavirus
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/lablog_viralrecon
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/percentajeNs.py
 delete mode 100644 bu_isciii/templates/genomeev/ANALYSIS/samples_ref.txt
 delete mode 100644 bu_isciii/templates/genomeev/DOC/hpc_slurm_pikavirus.config
 delete mode 100644 bu_isciii/templates/genomeev/DOC/mag.config
 delete mode 100644 bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic.config
 delete mode 100644 bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_ignore_merge_codons.config
 delete mode 100644 bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_params.yml
 delete mode 100644 bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_save_nohost.config
 delete mode 100644 bu_isciii/templates/genomeev/RAW/README
 delete mode 100644 bu_isciii/templates/genomeev/RESULTS/lablog_genomeev_results
 delete mode 100644 bu_isciii/templates/genomeev/TMP/README
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/lablog
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/samples_all/lablog
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/ANALYSIS/lablog
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/DOC/README
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/DOC/hpc_slurm_assembly.config
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/RAW/README
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/REFERENCES/README
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/RESULTS/README
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results
 delete mode 100644 bu_isciii/templates/mtbseq_assembly/TMP/README

diff --git a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog b/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
deleted file mode 100644
index 7a8120a75..000000000
--- a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS01_PIKAVIRUS/lablog
+++ /dev/null
@@ -1,38 +0,0 @@
-# module load Nextflow/21.10.6 singularity
-
-ln -s ../00-reads .
-ln -s ../samples_id.txt .
-echo "sample,fastq_1,fastq_2" > samplesheet.csv
-cat samples_id.txt | while read in; do echo "${in},00-reads/${in}_R1.fastq.gz,00-reads/${in}_R2.fastq.gz"; done >> samplesheet.csv
-
-
-scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")
-
-cat <<EOF > pikavirus.sbatch
-#!/bin/sh
-#SBATCH --ntasks 1
-#SBATCH --cpus-per-task 2
-#SBATCH --mem 4G
-#SBATCH --time 4:00:00
-#SBATCH --partition middle_idx
-#SBATCH --output $(date '+%Y%m%d')_pikavirus01.log
-#SBATCH --chdir $scratch_dir
-
-export NXF_OPTS="-Xms500M -Xmx4G"
-
-nextflow run /scratch/bi/pipelines/PikaVirus/main.nf \\
-    -c ../../DOC/hpc_slurm_pikavirus.config \\
-    --input samplesheet.csv \\
-    --kraken_scouting false \\
-    --virus true \\
-    --bacteria false \\
-    --fungi false \\
-    --kaiju false \\
-    --mash_winner_strategy true \\
-    --mash_identitity_threshold 0.9 \\
-    --mash_shared_hashes_threshold 0.01 \\
-    --mash_pvalue_threshold 0.05 \\
-    -resume
-EOF
-
-echo "sbatch pikavirus.sbatch" > _01_nf_pikavirus.sh
\ No newline at end of file
diff --git a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/lablog b/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/lablog
deleted file mode 100644
index 88edff156..000000000
--- a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/lablog
+++ /dev/null
@@ -1,25 +0,0 @@
-# module load singularity
-
-cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/kraken2_report.txt ./${in}_kraken2_report.txt; done
-
-scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")
-
-cat <<EOF > multiqc.sbatch
-#!/bin/sh
-#SBATCH --ntasks 1
-#SBATCH --cpus-per-task 2
-#SBATCH --mem 4G
-#SBATCH --time 00:30:00
-#SBATCH --partition short_idx
-#SBATCH --output $(date '+%Y%m%d')_multiqc.log
-#SBATCH --chdir $scratch_dir
-
-export NXF_OPTS="-Xms500M -Xmx4G"
-
-singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/multiqc:1.9--py_1 multiqc -d . --config multiqc_config.yaml
-
-EOF
-
-echo "sbatch multiqc.sbatch" > _01_run_multiqc.sh
-
-echo "find -type l | while read in; do unlink \${in}; done" > _02_unlink.sh
diff --git a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/multiqc_config.yaml b/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/multiqc_config.yaml
deleted file mode 100644
index 96b7e6136..000000000
--- a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/99-stats/multiqc_config.yaml
+++ /dev/null
@@ -1,13 +0,0 @@
-extra_fn_clean_exts:
-  - _R1
-  - _R2
-  - .R1
-  - .R2
-  - .sort
-  - _sort
-  - .stats
-  - _bamstat
-  - _align
-  - .txt
-report_comment: >
-    This report has been generated by BU-ISCIII
diff --git a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/lablog b/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/lablog
deleted file mode 100644
index 83e293d6f..000000000
--- a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS03_MAG/lablog
+++ /dev/null
@@ -1,30 +0,0 @@
-ln -s ../00-reads .
-ln -s ../samples_id.txt .
-
-#module load Nextflow
-#module load singularity
-
-scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")
-
-cat <<EOF > mag.sbatch
-#!/bin/sh
-#SBATCH --ntasks 1
-#SBATCH --cpus-per-task 2
-#SBATCH --mem 4G
-#SBATCH --time 2:00:00
-#SBATCH --partition middle_idx
-#SBATCH --output $(date '+%Y%m%d')_mag.log
-#SBATCH --chdir $scratch_dir
-
-export NXF_OPTS="-Xms500M -Xmx4G"
-
-nextflow run /data/bi/pipelines/nf-core-mag-2.1.1/workflow/main.nf \\
-    -c ../../DOC/mag.config \\
-    --input '00-reads/*_R{1,2}.fastq.gz' \\
-    --outdir $(date '+%Y%m%d')_mag \\
-    --kraken2_db /data/bi/references/kraken/minikraken_8GB_20200312.tgz \\
-    --skip_busco --skip_spades --skip_spadeshybrid --skip_megahit --skip_prodigal --skip_binning \\
-    -resume
-EOF
-
-echo "sbatch mag.sbatch" > _01_run_mag.sh
diff --git a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS04_BLAST/lablog b/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS04_BLAST/lablog
deleted file mode 100644
index 2986a343d..000000000
--- a/bu_isciii/templates/genomeev/ANALYSIS/ANALYSIS04_BLAST/lablog
+++ /dev/null
@@ -1,75 +0,0 @@
-# module load singularity
-
-scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")
-mkdir logs
-
-# Location of assemblies to a variable so it only has to be changed here
-LOCATION=../*/*/assembly/*/*
-# Other databases:
-# /data/bi/references/BLAST_dbs/nt_20211025/nt
-BLAST_DATABASE="/data/bi/references/virus/BLAST/all_virus.fasta"
-
-# if there are scaffolds, uncompress the scaffolds in its dir (zcat for decompression)
-# if there contigs and no scaffolds, uncompress the contigs as scaffolds in its dir
-echo "Samples that did not generate scaffolds:" > noscaffold.txt
-cat ../samples_id.txt | while read in; do
-    mkdir ${in}
-    # ls will return 0 if there are no scaffolds file
-    # NOTE: change extension and location at will
-    # NOTE2: zcat is only used in case of gzipped files, use a cp or ln -s if needed
-    if [ $(ls ${LOCATION}/${in}.scaffolds.fa.gz | wc -l) != 0 ]; then
-        zcat ${LOCATION}/${in}.scaffolds.fa.gz > ${in}/${in}.scaffolds.fa
-    else
-        # Note assemblies that did not make a scaffold
-        zcat ${LOCATION}/${in}.contigs.fa.gz > ${in}/${in}.scaffolds.fa
-        echo ${in} >> noscaffold.txt
-    fi
-done
-
-# NOTE3: change the -query flag to meet your requirements
-cat ../samples_id.txt | xargs -I %% echo "srun --chdir ${scratch_dir} --partition middle_idx --mem 200G --time 48:00:00 --cpus-per-task 10 --output logs/BLASTN_%%_%j.log --job-name BLASTN_%% singularity exec -B ${scratch_dir}/../../ -B
/data/bi/references/virus/BLAST /data/bi/pipelines/singularity-images/blast:2.11.0--pl5262h3289130_1 blastn -num_threads 10 -db ${BLAST_DATABASE} -query ${scratch_dir}/%%/%%.scaffolds.fa -out ${scratch_dir}/%%/%%_blast.tsv -outfmt '6 qseqid stitle qaccver saccver pident length mismatch gaps qstart qend sstart send evalue bitscore slen qlen qcovs' &" > _01_blast.sh - -# Filtering criteria: - # %refCovered > 0.7 - # ref not a phage (stitle ~! /phage/) - # ref longer than 200 bp (slen > 200) - -# First awk: create the full table; second awk: filter it -cat ../samples_id.txt | xargs -I %% echo "awk -v \"samplename=%%\" 'BEGIN{OFS=\"\t\";FS=\"\t\"}{print samplename,\$0,(\$6-\$8)/\$16,\$6/\$15}' %%/%%_blast.tsv | awk 'BEGIN{OFS=\"\t\";FS=\"\t\"} \$16 > 200 && \$17 > 0.7 && \$3 !~ /phage/ {print \$0}' > %%/%%_blast_filt.tsv" > _02_filter_blast.sh -echo -e "echo \"samplename\tqseqid\tstitle\tqaccver\tsaccver\tpident\tlength\tmismatch\tgap\tqstart\tqend\tsstart\tsend\tevalue\tbitscore\tref_len\tquery_len\tqcovs\t%queryAligned\t%refCovered\" > header" > _03_gather_results_add_header.sh -echo "cat header */*blast_filt.tsv > all_samples_filtered_BLAST_results.tsv" >> _03_gather_results_add_header.sh -cat ../samples_id.txt | xargs -I %% echo "cat header %%/%%_blast_filt.tsv > tmp; rm %%/%%_blast_filt.tsv; mv tmp %%/%%_blast_filt.tsv" >> _03_gather_results_add_header.sh -echo "rm header" >> _03_gather_results_add_header.sh - -# NOTES FOR FILTERING -# -# subject = reference -# -# COLS GENERATED BY US: -# 1: samplename -# GENERATED BY BLAST -# 2: contigname - qseqid -# 3: stitle -# 4: qaccver -# 5: saccver -# 6: pident -# 7: length (of alignment) -# 8: mismatch -# 9: gaps -# 10: qstart -# 11: qend -# 12: sstart -# 13: send -# 14: evalue -# 15: bitscore -# 16: ref len - slen -# 17: query len - qlen -# 18: qcovs -# MORE INFO: https://www.metagenomics.wiki/tools/blast/blastn-output-format-6 -# GENERATED BY US: -# 19: %queryAligned: (length-gaps)/qlen (if gaps are not deleted, then this would be bigger than 1 sometimes) -# 20: %refCovered: length/slen - -# conda activate 2excel -cat ../samples_id.txt | xargs -I %% echo "srun --chdir ${scratch_dir} --partition short_idx --mem 10G --time 1:00:00 --output logs/2excel_%%.log --job-name 2excel_%% python /data/bi/pipelines/utilities/export_excel_from_csv.py --input_file %%/%%_blast_filt.tsv --delimiter '\t' --output_filename %%/%%_blast_filt --it_has_index --it_has_header" > _04_to_excel.sh -echo "srun --chdir ${scratch_dir} --partition short_idx --mem 10G --time 1:00:00 --output logs/2excel_all.log --job-name 2excel_all python /data/bi/pipelines/utilities/export_excel_from_csv.py --input_file all_samples_filtered_BLAST_results.tsv --delimiter '\t' --output_filename all_samples_filtered_BLAST_results --it_has_index --it_has_header" >> _04_to_excel.sh diff --git a/bu_isciii/templates/genomeev/ANALYSIS/README b/bu_isciii/templates/genomeev/ANALYSIS/README deleted file mode 100644 index 0ecbe695b..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/README +++ /dev/null @@ -1,25 +0,0 @@ -This document should be read as INSTRUCTIONS to perform the "genomeev" service, as created on 25 Sep 2023. 
-The steps to follow to perform this service (which, by the way, can be done fairly quickly computationally speaking) are the following: - -- Load the samples into the RAW directory (manually or automatically using the BU-ISCIII tools) - -- Copy all files from this template (manually or automatically, make sure all files are there) - -- Copy the whole service folder to scratch_tmp (at least, we had to do that when this template was created) - -- First part is PikaVirus. Run PikaVirus by executing lablog_pikavirus, then enter the PikaVirus folder, execute the lablog (note that you need a samples_id.txt file, if you did not create it automatically, it has to be done manually), load the modules and do the thing. Feel free to change anything in PikaVirus through command or through the config (config is recommended so that any changes can be tracked). NOTE: wait for PikaVirus to end before you continue. Do something else in the meantime. read a paper or something dunno. - -- Once PikaVirus has ended, we have to dive into the results, particularly the "all_samples_virus_table.tsv" in the results dir. Here, we have to find the most abundant virus. I personally recommend opening this file in excel or similar, and find the virus that repeats the most in the samples using some formula such as "COUNTIF(range, value)". Make sure you are working with a genome and not with just a fragment of it. - -- Download said assembly locally, both its fna and its gff file. Make sure you store both files with the same name and different extension. The name SHOULD include the virus name, and the GCA/GCF code so its easier to identify (example: RotavirusG8_GCA_002669555_1.fasta; RotavirusG8_GCA_002669555_1.gff). Then, place it in the corresponding directory inside "/data/bi/references/virus". - -- Once the files have been placed, we have to modify the samples_ref.txt file. - First column will be the exact same as the samples_id.txt file. - Second column will be the name of the assemblies we downloaded in the previous step (example: RotavirusG8_GCA_002669555_1 ). Make sure that all the rows are the exact same. - Third column will be the name of the host (typically "human", but can be changed depending on the situation) - -- Execute the lablog_viralrecon. The ANALYSIS02 directory will be created and filled with the corresponding scripts. Load the modules and launch viralrecon. - -- Once it has ended, its time for MAG. Go to the ANALYSIS03 directory, execute the lablog, load the modules and run MAG with the specified params. - -- Last, but not least, go to the ANALYSIS04 directory and run the lablog, the lablog will check the assembly step in viralrecon, and will store the names of the samples that didnt assembly to the scaffold level in the noscaffold.txt file. Run normally the three scripts after loading the corresponding module, and that should be about everything there is to this service! 
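For illustration only, a filled-in samples_ref.txt following the three-column layout described above might look like the sketch below (SAMPLE01-SAMPLE03 are hypothetical placeholders, not part of the original template; the reference column reuses the RotavirusG8_GCA_002669555_1 example and the host column is "human", with columns separated by tabs):

SAMPLE01	RotavirusG8_GCA_002669555_1	human
SAMPLE02	RotavirusG8_GCA_002669555_1	human
SAMPLE03	RotavirusG8_GCA_002669555_1	human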
diff --git a/bu_isciii/templates/genomeev/ANALYSIS/_02_create_run_percentage_Ns.sh b/bu_isciii/templates/genomeev/ANALYSIS/_02_create_run_percentage_Ns.sh deleted file mode 100644 index 3e5e10128..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/_02_create_run_percentage_Ns.sh +++ /dev/null @@ -1 +0,0 @@ -i=1; find */variants/ivar/consensus/ -type d -name 'bcftools' | while read in; do echo "python ./percentajeNs.py ${in} %Ns_${i}.tab"; i=$((i+1)); done > _03_run_percentage_Ns.sh; echo "cat %Ns_* > %Ns.tab" >> _03_run_percentage_Ns.sh; echo "rm %Ns_*" >> _03_run_percentage_Ns.sh diff --git a/bu_isciii/templates/genomeev/ANALYSIS/create_assembly_stats.R b/bu_isciii/templates/genomeev/ANALYSIS/create_assembly_stats.R deleted file mode 100644 index d174e208f..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/create_assembly_stats.R +++ /dev/null @@ -1,130 +0,0 @@ -#!/usr/bin/env Rscript - -################################################ -################################################ -## LOAD LIBRARIES ## -################################################ -################################################ - -library(plyr, quietly = TRUE, warn.conflicts = FALSE) -library(dplyr, quietly = TRUE, warn.conflicts = FALSE) -library(tidyr, quietly = TRUE, warn.conflicts = FALSE) -library(stringr, quietly = TRUE, warn.conflicts = FALSE) -library(jsonlite, quietly = TRUE, warn.conflicts = FALSE) -library(writexl, quietly = TRUE, warn.conflicts = FALSE) - -################################################ -################################################ -## DATA ############################### -################################################ -################################################ - -# PATHS -path <- getwd() -samples_ref <- read.table(paste0(path, "/samples_ref.txt"), header = F) - -if (ncol(samples_ref) == 2) { - colnames(samples_ref) <- c("id", "ref") -} else { - colnames(samples_ref) <- c("id", "ref", "host") -} - -# Fastq path - -fastq_names <- list.files("../../RAW/") -path_run <- Sys.readlink(paste0("../../RAW/", fastq_names[1])) - -# columnas -columnas <- "run\tuser\thost\tVirussequence\tsample\ttotalreads\treadshostR1\treadshost\t%readshost\tNon-host-reads\t%Non-host-reads\tContigs\tLargest_contig\t%Genome_fraction" -name_columns <- as.vector(str_split(columnas, "\t", simplify = T)) - -list_assembly <- list(0) -for (i in 1:nrow(samples_ref)) { - - # Run, user, host and sequence - name_run <- str_split(path_run, "/", simplify = T)[, 4] - name_user <- str_split(path, "_", simplify = T)[, 5] - name_host <- tolower(str_split(path, "_", simplify = T)[, 9]) - date_service <- str_split(str_split(path, "_", simplify = T)[, 6], "/", simplify = T)[, 3] - - name_sequence <- as.character(samples_ref$ref[i]) - name_id <- as.character(samples_ref$id[i]) - - # path outputfolder - directorios <- list.dirs(recursive = FALSE) - patron_workdir <- paste0(name_sequence, "_", date_service) - workdir <- directorios[grepl(patron_workdir, directorios)][1] - - # totalreads - json_fastp <- fromJSON(paste0(workdir, "/fastp/", name_id, ".fastp.json")) - value_totalreads <- json_fastp$summary[["after_filtering"]]$total_reads - - # readshostR1 - table_kraken <- read.table(paste0(workdir, "/kraken2/", name_id, ".kraken2.report.txt"), sep = "\t") - unclassified_reads <- as.numeric(subset(x = table_kraken, subset = V6 == "unclassified")[2]) - value_readhostr1 <- sum(table_kraken$V3)-unclassified_reads - - # readshosh - value_readhost <- value_readhostr1 * 2 - - # readshost - value_percreadhost <- 
round((value_readhost * 100) / value_totalreads, 2) - - # non host reads - value_nonhostreads <- value_totalreads - value_readhost - - # % non host - value_percnonhostreads <- round((value_nonhostreads * 100) / value_totalreads, 2) - - # Contigs - assembly_workdir <- paste(workdir, "/assembly", sep = "") - quast_report_path <- paste("/",list.files(pattern = "transposed_report.tsv", recursive = TRUE, path = assembly_workdir), sep = "") - table_quast <- read.delim(paste0(assembly_workdir, quast_report_path), skip = 0, header = T, sep = "\t") - - # no quast error - if (exists("table_quast") == FALSE) { - value_contigs <- NA - value_lcontig <- NA - value_genomef <- NA - } else { - - sample_data <- subset(table_quast, Assembly == paste(name_id, "scaffolds", sep = ".")) - value_contigs <- as.numeric(sample_data$X..contigs) - value_lcontig <- as.numeric(sample_data$Largest.contig) - value_genomef <- as.numeric(as.character(sample_data$Genome.fraction....)) - - # empty values - # empty values - if (length(value_contigs) == 0) { - value_contigs <- NA - } - - if (length(value_lcontig) == 0) { - value_lcontig <- NA - } - - if (length(value_genomef) == 0) { - value_genomef <- NA - } - } - - # Create table - list_assembly[[i]] <- c(name_run, name_user, name_host, name_sequence, name_id, value_totalreads, value_readhostr1, value_readhost, value_percreadhost, value_nonhostreads, value_percnonhostreads, value_contigs, value_lcontig, value_genomef) -} - -df_final <- as.data.frame(do.call("rbind", list_assembly)) -colnames(df_final) <- name_columns - -# characters -columnas_ch <- as.vector(1:5) -df_final[, columnas_ch] <- apply(df_final[, columnas_ch], 2, function(x) as.character(x)) - -# numeric -columnas_nu <- as.vector(6:length(colnames(df_final))) -df_final[, columnas_nu] <- apply(df_final[, columnas_nu], 2, function(x) as.numeric(as.character(x))) - -# Write table csv -write.table(df_final, "assembly_stats.csv", row.names = F, col.names = T, sep = "\t", quote = F) - -# Write table xlsx -write_xlsx(df_final, "assembly_stats.xlsx", format_headers = F) diff --git a/bu_isciii/templates/genomeev/ANALYSIS/create_summary_report.sh b/bu_isciii/templates/genomeev/ANALYSIS/create_summary_report.sh deleted file mode 100644 index 4ed9b1929..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/create_summary_report.sh +++ /dev/null @@ -1,51 +0,0 @@ -#!/bin/bash - -# Define fixed data variables -RUN=$(ls -l ../../RAW/ | cut -d'/' -f4 | sort -u | grep -v 'total' | head -n1 | rev | cut -d " " -f 2- | rev) -USER=$(pwd | cut -d '/' -f6 | cut -d '_' -f4) -HOST=$(pwd | cut -d '/' -f8 | cut -d '_' -f4 | tr '[:upper:]' '[:lower:]' | sed 's/.*/\u&/') - -# Define header for output file -HEADER="run\tuser\thost\tVirussequence\tsample\ttotalreads\treadshostR1\treadshost\t%readshost\treadsvirus\t%readsvirus\tunmappedreads\t%unmapedreads\tmedianDPcoveragevirus\tCoverage>10x(%)\tVariantsinconsensusx10\tMissenseVariants\t%Ns10x\tLineage\tread_length\tanalysis_date" - -# Print header to output file -echo -e $HEADER > mapping_illumina_$(date '+%Y%m%d').tab - -# Loop through sample list and extract relevant data -cat samples_ref.txt | while read in -do - # Sample and virus reference names - arr=($in); - - # Extract data for each column - total_reads=$(grep 'total_reads' ${arr[1]}*/fastp/${arr[0]}.fastp.json | head -n2 | tail -n1 | cut -d ':' -f2 | sed 's/,//g') - - reads_hostR1=$(cat ${arr[1]}*/kraken2/${arr[0]}.kraken2.report.txt | grep -v 'unclassified' | cut -f3 | awk '{s+=$1}END{print s}') - reads_host_x2=$(echo $((reads_hostR1 * 
2)) ) - perc_mapped=$(echo $(awk -v v1=$total_reads -v v2=$reads_host_x2 'BEGIN {print (v2*100)/v1}') ) - - reads_virus=$(cat ${arr[1]}*/variants/bowtie2/samtools_stats/${arr[0]}.sorted.bam.flagstat | grep '+ 0 mapped' | cut -d ' ' -f1) - - unmapped_reads=$(echo $((total_reads - (reads_host_x2+reads_virus))) ) - perc_unmapped=$(echo $(awk -v v1=$total_reads -v v2=$unmapped_reads 'BEGIN {print (v2/v1)*100}') ) - - n_count=$(cat %Ns.tab | grep -w ${arr[0]} | grep ${arr[1]} | cut -f2) - - missense=$(LC_ALL=C awk -F, '{if($10 >= 0.75)print $0}' ${arr[1]}*/variants/ivar/variants_long_table.csv | grep ^${arr[0]}, | grep 'missense' | wc -l) - - Ns_10x_perc=$(zcat ${arr[1]}*/variants/ivar/consensus/bcftools/${arr[0]}.filtered.vcf.gz | grep -v '^#' | wc -l) - - lineage=$(cat ${arr[1]}*/variants/ivar/consensus/bcftools/pangolin/${arr[0]}.pangolin.csv | tail -n1 | cut -d ',' -f2) - - metrics=$(cat ${arr[1]}*/multiqc/summary_variants_metrics_mqc.csv | grep ^${arr[0]},) - reads_virus_perc=$(echo "$metrics" | cut -d ',' -f5) - medianDPcov=$(echo "$metrics" | cut -d ',' -f8) - cov10x=$(echo "$metrics" | cut -d ',' -f10) - - read_length=$(cat ${arr[1]}*/multiqc/multiqc_data/multiqc_fastqc.yaml | grep -A5 "${arr[0]}_1:$" | grep "Sequence length:" | tr "-" " " | rev | cut -d " " -f1 | rev) - - analysis_date=$(date '+%Y%m%d') - - # Introduce data row into output file - echo -e "${RUN}\t${USER}\t${HOST}\t${arr[1]}\t${arr[0]}\t$total_reads\t$reads_hostR1\t$reads_host_x2\t$perc_mapped\t$reads_virus\t$reads_virus_perc\t$unmapped_reads\t$perc_unmapped\t$medianDPcov\t$cov10x\t$Ns_10x_perc\t$missense\t$n_count\t$lineage\t$read_length\t$analysis_date" >> mapping_illumina_$(date '+%Y%m%d').tab -done diff --git a/bu_isciii/templates/genomeev/ANALYSIS/deduplicate_long_table.sh b/bu_isciii/templates/genomeev/ANALYSIS/deduplicate_long_table.sh deleted file mode 100644 index 146f23efb..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/deduplicate_long_table.sh +++ /dev/null @@ -1,6 +0,0 @@ -find . 
-type f -name "variants_long_table.csv" | cut -d '/' -f1,2,3,4 | while read in -do - mv ${in}/variants_long_table.csv ${in}/variants_long_table_dups.csv - head -n1 ${in}/variants_long_table_dups.csv > ${in}/variants_long_table.csv - grep -v 'SAMPLE' ${in}/variants_long_table_dups.csv | sort -u >> ${in}/variants_long_table.csv -done diff --git a/bu_isciii/templates/genomeev/ANALYSIS/lablog_pikavirus b/bu_isciii/templates/genomeev/ANALYSIS/lablog_pikavirus deleted file mode 100644 index 04924688f..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/lablog_pikavirus +++ /dev/null @@ -1,4 +0,0 @@ -mkdir -p 00-reads -mv ANALYSIS01_PIKAVIRUS $(date '+%Y%m%d')_ANALYSIS01_PIKAVIRUS -cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd - -cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd - \ No newline at end of file diff --git a/bu_isciii/templates/genomeev/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/genomeev/ANALYSIS/lablog_viralrecon deleted file mode 100644 index fc2a53206..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/lablog_viralrecon +++ /dev/null @@ -1,68 +0,0 @@ -ANALYSIS_TYPE=METAGENOMIC -CONFIG_FILE="../../DOC/viralrecon_metagenomic.config" -PARAMS_FILE="../../DOC/viralrecon_metagenomic_params.yml" - -cat samples_ref.txt | cut -f3 | sort -u | while read in; do echo ${in^^}; done > host_list.tmp -i=2; cat host_list.tmp | while read in -do - FOLDER_NAME=$(echo $(date '+%Y%m%d')_ANALYSIS0${i}_${ANALYSIS_TYPE}_${in}) - mkdir ${FOLDER_NAME} - cp create_summary_report.sh ${FOLDER_NAME}/ - cp deduplicate_long_table.sh ${FOLDER_NAME}/ - cp percentajeNs.py ${FOLDER_NAME}/ - grep -i ${in} samples_ref.txt | cut -f1,2 > ${FOLDER_NAME}/samples_ref.txt - echo "ln -s ../00-reads ." 
> ${FOLDER_NAME}/lablog - printf "ln -s ../samples_id.txt .\n\n" >> ${FOLDER_NAME}/lablog - echo "# module load Nextflow/22.10.1 singularity" >> ${FOLDER_NAME}/lablog - echo "" >> ${FOLDER_NAME}/lablog - printf 'scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")\n\n' >> ${FOLDER_NAME}/lablog - cut -f2 ${FOLDER_NAME}/samples_ref.txt | sort -u | while read ref - do - echo "sample,fastq_1,fastq_2" > ${FOLDER_NAME}/samplesheet_${ref}.csv - grep -i ${ref} ${FOLDER_NAME}/samples_ref.txt | while read samples - do - arr=($samples); echo "${arr[0]},00-reads/${arr[0]}_R1.fastq.gz,00-reads/${arr[0]}_R2.fastq.gz" >> ${FOLDER_NAME}/samplesheet_${ref}.csv - done - REF_FASTA=$(find /data/bi/references/virus/ -name ${ref}.fasta) - REF_GFF=$(find /data/bi/references/virus/ -name ${ref}.gff) - echo "cat < ${ref}_viralrecon.sbatch" >> ${FOLDER_NAME}/lablog - echo "#!/bin/sh" >> ${FOLDER_NAME}/lablog - echo "#SBATCH --ntasks 1" >> ${FOLDER_NAME}/lablog - echo "#SBATCH --cpus-per-task 2" >> ${FOLDER_NAME}/lablog - echo "#SBATCH --mem 4G" >> ${FOLDER_NAME}/lablog - echo "#SBATCH --time 2:00:00" >> ${FOLDER_NAME}/lablog - echo "#SBATCH --partition middle_idx" >> ${FOLDER_NAME}/lablog - echo "#SBATCH --output ${ref}_$(date '+%Y%m%d')_viralrecon.log" >> ${FOLDER_NAME}/lablog - printf "#SBATCH --chdir \$scratch_dir\n\n" >> ${FOLDER_NAME}/lablog - printf 'export NXF_OPTS="-Xms500M -Xmx4G"\n\n' >> ${FOLDER_NAME}/lablog - echo "nextflow run /data/bi/pipelines/nf-core-viralrecon-2.6.0/workflow/main.nf \\\\" >> ${FOLDER_NAME}/lablog - echo " -c ${CONFIG_FILE} \\\\" >> ${FOLDER_NAME}/lablog - echo " -params-file ${PARAMS_FILE} \\\\" >> ${FOLDER_NAME}/lablog - echo " --input samplesheet_${ref}.csv \\\\" >> ${FOLDER_NAME}/lablog - echo " --outdir ${ref}_$(date '+%Y%m%d')_viralrecon_mapping \\\\" >> ${FOLDER_NAME}/lablog - echo " --fasta ${REF_FASTA} \\\\" >> ${FOLDER_NAME}/lablog - echo " --gff ${REF_GFF} \\\\" >> ${FOLDER_NAME}/lablog - echo " -resume" >> ${FOLDER_NAME}/lablog - printf "EOF\n\n" >> ${FOLDER_NAME}/lablog - printf "echo 'sbatch ${ref}_viralrecon.sbatch' > _01_run_${ref}_viralrecon.sh\n\n" >> ${FOLDER_NAME}/lablog - done - echo "# conda activate python3" >> ${FOLDER_NAME}/lablog - - cp _02_create_run_percentage_Ns.sh ${FOLDER_NAME}/ - printf 'echo "bash create_summary_report.sh" > _04_create_stats_table.sh\n\n' >> ${FOLDER_NAME}/lablog - cp create_assembly_stats.R ${FOLDER_NAME}/ - echo "# module load R/4.2.1" >> ${FOLDER_NAME}/lablog - printf 'echo "Rscript create_assembly_stats.R" > _05_create_stats_assembly.sh\n\n' >> ${FOLDER_NAME}/lablog - printf 'echo "bash deduplicate_long_table.sh" > _06_deduplicate_long_table.sh\n\n' >> ${FOLDER_NAME}/lablog - - i=$((i+1)) -done -rm host_list.tmp -rm create_summary_report.sh -rm deduplicate_long_table.sh -rm percentajeNs.py -rm _02_create_run_percentage_Ns.sh - -# Exclusive of genomeev and viral_discovery service, if you see this anywhere else, somebody has copied without reading (https://youtu.be/AgGtGORPHcM?t=4) -mv ANALYSIS03_MAG $(date '+%Y%m%d')_ANALYSIS03_MAG -mv ANALYSIS04_BLAST $(date '+%Y%m%d')_ANALYSIS04_BLAST diff --git a/bu_isciii/templates/genomeev/ANALYSIS/percentajeNs.py b/bu_isciii/templates/genomeev/ANALYSIS/percentajeNs.py deleted file mode 100644 index c2552969c..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/percentajeNs.py +++ /dev/null @@ -1,21 +0,0 @@ -from Bio import SeqIO -import os -import argparse - -parser = argparse.ArgumentParser(description="Count %Ns") -parser.add_argument("input_dir", type=str, help="Input 
dir masked files") -parser.add_argument("output_file", type=str, help="Output file for Ns count") -args = parser.parse_args() - -out_handle = open(args.output_file, "w") - -for f in os.listdir(args.input_dir): - if f.endswith(".consensus.fa"): - ffpath = os.path.join(args.input_dir, f) - for record in SeqIO.parse(ffpath, "fasta"): - n_count = record.seq.count("N") + record.seq.count("n") - out_handle.write( - "%s\t%0.2f\n" % (record.description, n_count * 100.0 / len(record)) - ) - -out_handle.close() diff --git a/bu_isciii/templates/genomeev/ANALYSIS/samples_ref.txt b/bu_isciii/templates/genomeev/ANALYSIS/samples_ref.txt deleted file mode 100644 index 5e3528b12..000000000 --- a/bu_isciii/templates/genomeev/ANALYSIS/samples_ref.txt +++ /dev/null @@ -1,4 +0,0 @@ -SampleID Reference Host -SampleID Reference Host -SampleID Reference Host - diff --git a/bu_isciii/templates/genomeev/DOC/hpc_slurm_pikavirus.config b/bu_isciii/templates/genomeev/DOC/hpc_slurm_pikavirus.config deleted file mode 100644 index 2517ff51d..000000000 --- a/bu_isciii/templates/genomeev/DOC/hpc_slurm_pikavirus.config +++ /dev/null @@ -1,32 +0,0 @@ -/* - * --------------------------------------------------------------- - * Nextflow config file for the ISCIII High Performance Computer - * --------------------------------------------------------------- - * - * nextflow run PikaVirus/manin.nf -profile HPC_ISCIII, - */ - -process{ - executor = 'slurm' - queue = 'middle_idx' - conda = '/data/bi/pipelines/miniconda3/envs/PikaVirus' - errorStrategy = { task.exitStatus in [140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 'ignore' : 'finish' } - maxRetries = 5 - maxErrors = '-1' -} - -params { - config_profile_name = 'ISCIII HPC profile' - config_profile_description = 'Profile designed for the High Performance Computer in the ISCIII' - kraken2_db = "/data/bi/references/kraken/minikraken_8GB_20200312" - vir_ref_dir = "/data/bi/references/PikaVirus/viral_assemblies_for_pikavirus" - vir_dir_repo = "/data/bi/references/PikaVirus/viral_assemblies.tsv" - bact_ref_dir = "/data/bi/references/PikaVirus/bacteria_assemblies_for_pikavirus" - bact_dir_repo = "/data/bi/references/PikaVirus/bacteria_assemblies.tsv" - fungi_ref_dir = "/data/bi/references/PikaVirus/fungi_assemblies_for_pikavirus" - fungi_dir_repo = "/data/bi/references/PikaVirus/fungi_assemblies.tsv" - outdir = "01-PikaVirus-results" - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/genomeev/DOC/mag.config b/bu_isciii/templates/genomeev/DOC/mag.config deleted file mode 100644 index 732980bf1..000000000 --- a/bu_isciii/templates/genomeev/DOC/mag.config +++ /dev/null @@ -1,19 +0,0 @@ -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - queue = 'middle_idx' - errorStrategy = { task.exitStatus in [140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 
'ignore' : 'finish' } - maxRetries = 1 - maxErrors = '-1' -} - -params { - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic.config b/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic.config deleted file mode 100644 index 66e8911f5..000000000 --- a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic.config +++ /dev/null @@ -1,19 +0,0 @@ -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - withName: 'FASTP' { - ext.args = '--cut_front --cut_tail --trim_poly_x --cut_mean_quality 20 --qualified_quality_phred 20 --unqualified_percent_limit 10 --length_required 50' - } -} - -params { - // Max resource options - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_ignore_merge_codons.config b/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_ignore_merge_codons.config deleted file mode 100644 index bb575ee33..000000000 --- a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_ignore_merge_codons.config +++ /dev/null @@ -1,42 +0,0 @@ -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - withName: 'FASTP' { - ext.args = '--cut_front --cut_tail --trim_poly_x --cut_mean_quality 20 --qualified_quality_phred 20 --unqualified_percent_limit 10 --length_required 50' - } - withName: 'PANGOLIN' { - ext.args = '--datadir /scratch/bi/references/pangolin/20220322' - container = 'https://depot.galaxyproject.org/singularity/pangolin:3.1.20--pyhdfd78af_0' - } - withName: 'IVAR_VARIANTS_TO_VCF' { - ext.args = params.protocol == 'amplicon' ? '--ignore_strand_bias --ignore_merge_codons' : '--ignore_merge_codons' - } -} - -params { - // Input options - platform=illumina - protocol=metagenomic - - // Illumina QC, read trimming and filtering options - kraken2_db="/data/bi/references/eukaria/homo_sapiens/hg38/UCSC/kraken2/kraken2_human.tar.gz" - - // Illumina variant calling options - variant_caller=ivar - consensus_caller=bcftools - skip_pangolin=true - skip_nextclade=true - - // Illumina de novo assembly options - skip_assembly=true - - // Max resource options - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_params.yml b/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_params.yml deleted file mode 100644 index 7ef761860..000000000 --- a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_params.yml +++ /dev/null @@ -1,11 +0,0 @@ -platform: 'illumina' -protocol: 'metagenomic' -kraken2_db: '/data/bi/references/eukaria/homo_sapiens/hg38/UCSC/kraken2/kraken2_human.tar.gz' -variant_caller: 'ivar' -consensus_caller: 'bcftools' -skip_pangolin: true -skip_nextclade: true -skip_variants: true -skip_assembly: false -skip_abacas: true -skip_plasmidid: true diff --git a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_save_nohost.config b/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_save_nohost.config deleted file mode 100644 index a62b5ac42..000000000 --- a/bu_isciii/templates/genomeev/DOC/viralrecon_metagenomic_save_nohost.config +++ /dev/null @@ -1,40 +0,0 @@ -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - withName: 'FASTP' { - ext.args = '--cut_front --cut_tail --trim_poly_x --cut_mean_quality 20 --qualified_quality_phred 20 --unqualified_percent_limit 10 
--length_required 50' - } - withName: 'KRAKEN2_KRAKEN2' { - publishDir = [ - pattern: "*.{unclassified_1.fastq.gz,unclassified_2.fastq.gz,txt}" - ] - } -} - -params { - // Input options - platform=illumina - protocol=metagenomic - - // Illumina QC, read trimming and filtering options - kraken2_db="/data/bi/references/eukaria/homo_sapiens/hg38/UCSC/kraken2/kraken2_human.tar.gz" - - // Illumina variant calling options - variant_caller=ivar - consensus_caller=bcftools - skip_pangolin=true - skip_nextclade=true - - // Illumina de novo assembly options - skip_assembly=true - - // Max resource options - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/genomeev/RAW/README b/bu_isciii/templates/genomeev/RAW/README deleted file mode 100644 index deb5220b4..000000000 --- a/bu_isciii/templates/genomeev/RAW/README +++ /dev/null @@ -1 +0,0 @@ -RAW template diff --git a/bu_isciii/templates/genomeev/RESULTS/lablog_genomeev_results b/bu_isciii/templates/genomeev/RESULTS/lablog_genomeev_results deleted file mode 100644 index c593c7acb..000000000 --- a/bu_isciii/templates/genomeev/RESULTS/lablog_genomeev_results +++ /dev/null @@ -1,17 +0,0 @@ -# conda activate 2excel -mkdir $(date '+%Y%m%d')_entrega01 -cd $(date '+%Y%m%d')_entrega01 - -#Create directories depending on the analysis -mkdir assembly_spades -mkdir blast - -#Create symbolic links depending on the analysis -#Individual files -ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html -ln -s ../../ANALYSIS/*/assembly_stats.xlsx ./assembly_stats.xlsx -python /scratch/bi/pipelines/utilities/export_excel_from_csv.py --input_file ../../ANALYSIS/*PIKAVIRUS*/*/all_samples_virus_table_filtered.tsv --delimiter '\t' --output_filename filtered_all_samples_virus_table --it_has_index --it_has_header - -#Folders -cd assembly_spades; ln -s ../../../ANALYSIS/*BLAST*/*/*scaffolds.fa .; cd - -cd blast; ln -s ../../../ANALYSIS/*BLAST*/all_samples_filtered_BLAST_results.xlsx .; ln -s ../../../ANALYSIS/*BLAST*/*/*.xlsx .; cd - diff --git a/bu_isciii/templates/genomeev/TMP/README b/bu_isciii/templates/genomeev/TMP/README deleted file mode 100644 index 36ecd8ddc..000000000 --- a/bu_isciii/templates/genomeev/TMP/README +++ /dev/null @@ -1 +0,0 @@ -TMP templates diff --git a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog b/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog deleted file mode 100644 index 2124059d3..000000000 --- a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS01_ASSEMBLY/lablog +++ /dev/null @@ -1,37 +0,0 @@ -# module load Nextflow/21.10.6 singularity - -ln -s ../00-reads . -ln -s ../samples_id.txt . 
- -echo "sample,fastq_1,fastq_2" > samplesheet.csv -cat samples_id.txt | while read in; do echo "${in},00-reads/${in}_R1.fastq.gz,00-reads/${in}_R2.fastq.gz"; done >> samplesheet.csv - -#module load Nextflow singularity -scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") - -cat < assembly.sbatch -#!/bin/sh -#SBATCH --ntasks 1 -#SBATCH --cpus-per-task 2 -#SBATCH --mem 8G -#SBATCH --time 8:00:00 -#SBATCH --partition middle_idx -#SBATCH --output $(date '+%Y%m%d')_assembly01.log -#SBATCH --chdir $scratch_dir - -export NXF_OPTS="-Xms500M -Xmx4G" - -nextflow run /scratch/bi/pipelines/BU_ISCIII-bacterial-assembly/main.nf \\ - -c ../../DOC/hpc_slurm_assembly.config \\ - --input samplesheet.csv \\ - --outdir ./ \\ - --cut_mean_quality 20 \\ - --qualified_quality_phred 20 \\ - --gram + \\ - --save_trimmed true \\ - --kmerfinder_bacteria_database '/data/bi/references/kmerfinder/20190108_stable_dirs/bacteria' \\ - --reference_ncbi_bacteria '/data/bi/references/bacteria/latest_db/assembly_summary_bacteria.txt' \\ - -resume -EOF - -echo "sbatch assembly.sbatch" > _01_nf_assembly.sh diff --git a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/lablog b/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/lablog deleted file mode 100644 index 73d719fe1..000000000 --- a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/lablog +++ /dev/null @@ -1,21 +0,0 @@ -# module load singularity -# NOTE: error Java version is fixed by using module purge -mkdir logs -scratch_dir=$(echo $(pwd) | sed "s@/data/bi/scratch_tmp/@/scratch/@g") - -cat ../samples_id.txt | xargs -I % echo "mkdir %; cd %; ln -s ../../*ANALYSIS01*/01-preprocessing/trimmed_sequences/%_1.trim.fastq.gz %_lib1_R1.fastq.gz; cd -" | bash -cat ../samples_id.txt | xargs -I % echo "cd %; ln -s ../../*ANALYSIS01*/01-preprocessing/trimmed_sequences/%_2.trim.fastq.gz %_lib1_R2.fastq.gz; cd -" | bash -cat ../samples_id.txt | xargs -I % echo "cd %; ls *.fastq.gz | tr '_' '\t' | cut -f 1,2 | sort -u > samples.txt; cd -" | bash - -cat ../samples_id.txt | xargs -I @@ echo -e "srun --job-name MTBSEQ.@@ --output logs/MTBSEQ.@@.%j.log --partition middle_idx --mem 100G --chdir ${scratch_dir}/@@ --cpus-per-task 10 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/mtbseq:1.0.4--hdfd78af_2 MTBseq --step TBfull --threads 10 --samples samples.txt &" > _01_mtbseq.sh - -# classification -YEAR=$(date +%Y) -echo "mkdir classification_all" > _02_gather_results.sh -echo "FIRST_SAMPLE=$( head -n1 ../samples_id.txt ); head -n 1 \${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'${YEAR}\" */Classification/Strain_Classification.tab | cut -d \":\" -f 2 >> classification_all/strain_classification_all.tab" >> _02_gather_results.sh -# resistances -echo "mkdir resistances_all" >> _02_gather_results.sh -cat ../samples_id.txt | xargs -I % echo "cp %/Amend/NONE_joint_cf4_cr4_fr75_ph4_samples1_amended.tab resistances_all/%_var_res.tab" >> _02_gather_results.sh -# stats -echo "mkdir stats_all" >> _02_gather_results.sh -echo "FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 \$FIRST_SAMPLE/Statistics/Mapping_and_Variant_Statistics.tab > stats_all/statistics_all.tab; grep \"^'${YEAR}\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d \":\" -f 2 >> stats_all/statistics_all.tab" >> _02_gather_results.sh diff --git a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/samples_all/lablog 
b/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/samples_all/lablog deleted file mode 100644 index 3fd8c8dfc..000000000 --- a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/ANALYSIS02_MTBSEQ/samples_all/lablog +++ /dev/null @@ -1,22 +0,0 @@ -# module load singularity -# this will be performed in case a tree is requested -mkdir logs -scratch_dir=$(echo $(pwd) | sed "s@/data/bi/scratch_tmp/@/scratch/@g") - -mkdir Amend Bam Called Classification GATK_Bam Groups Joint Mpileup Position_Tables Statistics -cat ../*/samples.txt > samples.txt - -#### Create symbolic links to the folders already created -cd Bam; ln -s ../../*/Bam/* . ; cd - -cd Called; ln -s ../../*/Called/* . ; cd - -cd GATK_Bam; ln -s ../../*/GATK_Bam/* . ; cd - -cd Mpileup; ln -s ../../*/Mpileup/* . ; cd - -cd Position_Tables; ln -s ../../*/Position_Tables/* . ; cd - - -##### Create join scripts -echo "srun --job-name MTBSEQ_JOIN --output logs/MTBSEQ_JOIN.%j.log --partition middle_obx --mem 48G --chdir ${scratch_dir} --cpus-per-task 10 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/mtbseq:1.0.4--hdfd78af_2 MTBseq --step TBjoin --threads 5 --samples ${scratch_dir}/samples.txt &" > _01_tb_join.sh -echo "srun --job-name MTBSEQ_AMEND --output logs/MTBSEQ_AMEND.%j.log --partition middle_obx --mem 48G --chdir ${scratch_dir} --cpus-per-task 10 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/mtbseq:1.0.4--hdfd78af_2 MTBseq --step TBamend --threads 5 --samples ${scratch_dir}/samples.txt &" > _02_tb_amend.sh -echo "srun --job-name MTBSEQ_GROUPS --output logs/MTBSEQ_GROUPS.%j.log --partition middle_obx --mem 48G --chdir ${scratch_dir} --cpus-per-task 10 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/mtbseq:1.0.4--hdfd78af_2 MTBseq --step TBgroups --threads 5 --samples ${scratch_dir}/samples.txt &" > _03_tb_groups.sh - -##### Execute iqtree -echo "srun --chdir ${scratch_dir} --output logs/IQTREEFULLALIGN.%j.log --job-name IQTREEFULLALIGN --cpus-per-task 20 --mem 15G --partition short_idx --time 08:00:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/Amend/*amended_u95_phylo_w12.plainIDs.fasta -m K3Pu+F+I -T 20 -B 1000 -pre phylo.iqtree.bootstrap &" > _04_iqtreeall.sh diff --git a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/lablog b/bu_isciii/templates/mtbseq_assembly/ANALYSIS/lablog deleted file mode 100644 index 05094a174..000000000 --- a/bu_isciii/templates/mtbseq_assembly/ANALYSIS/lablog +++ /dev/null @@ -1,6 +0,0 @@ -mkdir -p 00-reads -mkdir -p $(date '+%Y%m%d')_ANALYSIS01_ASSEMBLY -mkdir -p $(date '+%Y%m%d')_ANALYSIS02_MTBSEQ -ls ../RAW/*.gz | cut -d "/" -f3 | cut -d "_" -f1 | sort -u > samples_id.txt -cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd - -cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd - \ No newline at end of file diff --git a/bu_isciii/templates/mtbseq_assembly/DOC/README b/bu_isciii/templates/mtbseq_assembly/DOC/README deleted file mode 100644 index b9ad751ba..000000000 --- a/bu_isciii/templates/mtbseq_assembly/DOC/README +++ /dev/null @@ -1 +0,0 @@ -DOC template diff --git a/bu_isciii/templates/mtbseq_assembly/DOC/hpc_slurm_assembly.config b/bu_isciii/templates/mtbseq_assembly/DOC/hpc_slurm_assembly.config deleted file mode 100644 index 9af022258..000000000 --- 
a/bu_isciii/templates/mtbseq_assembly/DOC/hpc_slurm_assembly.config +++ /dev/null @@ -1,27 +0,0 @@ -conda { - enabled = true - autoMounts = true -} - -singularity { - enabled = true - autoMounts = true -} - -process { - executor = 'slurm' - queue = 'middle_idx' - conda = '/data/bi/pipelines/miniconda3/envs/assembly' - errorStrategy = { task.exitStatus in [140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 'ignore' : 'finish' } - maxRetries = 1 - maxErrors = '-1' - withName:KMERFINDER { - container = '/scratch/bi/singularity-images/kmerfinder_v3.0.2.sif' - } -} - -params { - max_memory = 376.GB - max_cpus = 32 - max_time = '48.h' -} diff --git a/bu_isciii/templates/mtbseq_assembly/RAW/README b/bu_isciii/templates/mtbseq_assembly/RAW/README deleted file mode 100644 index deb5220b4..000000000 --- a/bu_isciii/templates/mtbseq_assembly/RAW/README +++ /dev/null @@ -1 +0,0 @@ -RAW template diff --git a/bu_isciii/templates/mtbseq_assembly/REFERENCES/README b/bu_isciii/templates/mtbseq_assembly/REFERENCES/README deleted file mode 100644 index 834c3390f..000000000 --- a/bu_isciii/templates/mtbseq_assembly/REFERENCES/README +++ /dev/null @@ -1 +0,0 @@ -REFERENCES template diff --git a/bu_isciii/templates/mtbseq_assembly/RESULTS/README b/bu_isciii/templates/mtbseq_assembly/RESULTS/README deleted file mode 100644 index 5f9902779..000000000 --- a/bu_isciii/templates/mtbseq_assembly/RESULTS/README +++ /dev/null @@ -1 +0,0 @@ -RESULTS templates diff --git a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results b/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results deleted file mode 100644 index d2bf377f2..000000000 --- a/bu_isciii/templates/mtbseq_assembly/RESULTS/lablog_mtbseq_assembly_results +++ /dev/null @@ -1,9 +0,0 @@ -DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega" - -mkdir $DELIVERY_FOLDER - -# MTBSEQ-ASSEMBLY service -cd $DELIVERY_FOLDER - -# Links to reports -ln -s ../../ANALYSIS/*ASSEMBLY/99-stats/MultiQC/multiqc_report.html . diff --git a/bu_isciii/templates/mtbseq_assembly/TMP/README b/bu_isciii/templates/mtbseq_assembly/TMP/README deleted file mode 100644 index 36ecd8ddc..000000000 --- a/bu_isciii/templates/mtbseq_assembly/TMP/README +++ /dev/null @@ -1 +0,0 @@ -TMP templates From 02379547864fc72b4b7f8ef96a9631ab60d7109b Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 4 Jul 2024 12:53:02 +0200 Subject: [PATCH 089/321] Updated CHANGELOG.md --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 253b5add6..37427a03c 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -51,7 +51,7 @@ Code contributions to the new version: - Added MAG tempalte and removed MAG from other templates [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288) - Added amrfinderplus to characterization template. 
[#289] (https://github.com/BU-ISCIII/buisciii-tools/pull/289) - Updated all files so that paths referring to /pipelines/ are updated according to the new structure [#287](https://github.com/BU-ISCIII/buisciii-tools/pull/287) -- Updated assembly's template (lablog and config files) [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) +- Updated assembly, ariba, snippy and amrfinderplus templates, removed genomeev and mtbseq_assembly templates and updated services.json [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) ### Modules From 31535cf704361fc95b227199352042cdfdcaa7e6 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 4 Jul 2024 13:31:00 +0200 Subject: [PATCH 090/321] Updated iqtree lablog --- .../snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog index e351131c1..f40bd67d9 100644 --- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog +++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/05-iqtree/lablog @@ -2,5 +2,5 @@ scratch_dir=$(echo $PWD | sed 's/\/data\/bi\/scratch_tmp/\/scratch/g') mkdir logs -#echo "srun --chdir \${scratch_dir} --output logs/IQTREEMFP.%j.log --job-name IQTREEMFP --cpus-per-task 20 --mem 5G --partition short_idx --time 00:30:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../04-snippy/phylo.aln -m MFP &" > _00_iqtreemfp.sh -echo "srun --chdir ${scratch_dir} --output logs/IQTREEFULLALIGN.%j.log --job-name IQTREEFULLALIGN --cpus-per-task 20 --mem 15G --partition short_idx --time 08:00:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../04-snippy/phylo.aln -m PMB+F+R2 -T 20 -B 1000 -pre phylo.iqtree.bootstrap &" > _01_iqtreeall.sh +#echo "srun --chdir ${scratch_dir} --output logs/IQTREEMFP.%j.log --job-name IQTREEMFP --cpus-per-task 20 --mem 5G --partition short_idx --time 00:30:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../04-snippy/phylo.aln -m MFP &" > _00_iqtreemfp.sh +echo "srun --chdir ${scratch_dir} --output logs/IQTREEFULLALIGN.%j.log --job-name IQTREEFULLALIGN --cpus-per-task 20 --mem 15G --partition short_idx --time 08:00:00 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/iqtree:2.1.4_beta--hdcc8f71_0 iqtree -s ${scratch_dir}/../04-snippy/phylo.aln -m HKY+F+I -T 20 -B 1000 -pre phylo.iqtree.bootstrap &" > _01_iqtreeall.sh From f8fb17ebb38eed15cffb80a1d112237e7fb29e63 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 4 Jul 2024 13:35:15 +0200 Subject: [PATCH 091/321] Updated snippy lablog --- .../snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog index c67c2a06d..2db8ad881 100644 --- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog +++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog @@ -23,9 +23,12 @@ echo "srun --chdir ${scratch_dir} --output logs/SNIP-SITES.%j.log --job-name SNI # awk 'BEGIN{FS="[> ]"} 
/^>/{val=$2;next} {print val,length($0)}' phylo.aln +# code to compare samples in pairs +# awk '$4 != $5 || $4 != $6 || $5 != $6' core.tab > differences.txt + ## GUBBINS commands -echo "snippy-clean_full_aln core.full.aln > clean.full.aln" > _03_gubbins.sh -echo "run_gubbins.py --threads 20 -p gubbins clean.full.aln" >> _03_gubbins.sh -echo "snp-sites -c gubbins.filtered_polymorphic_sites.fasta > clean.core.aln" >> _03_gubbins.sh +echo "env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 snippy-clean_full_aln core.full.aln > clean.full.aln" > _03_gubbins.sh +echo "singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/gubbins:3.3.5--py39pl5321he4a0461_0 run_gubbins.py --threads 20 -p gubbins clean.full.aln" >> _03_gubbins.sh +echo "env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 snp-sites -c gubbins.filtered_polymorphic_sites.fasta > clean.core.aln" >> _03_gubbins.sh # Run gubbins echo "srun --chdir ${scratch_dir} --output logs/GUBBINS.%j.log --job-name GUBBINS --cpus-per-task 20 --mem 49152 --partition short_idx --time 02:00:00 bash _03_gubbins.sh &" > _03_run_gubbins.sh From 318543bce3f5fe3e5620a20db1f94341a9755b4d Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 4 Jul 2024 16:20:26 +0200 Subject: [PATCH 092/321] Fixed minor mistakes in snippy's lablog --- .../snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog index 2db8ad881..6154d78bf 100644 --- a/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog +++ b/bu_isciii/templates/snippy/ANALYSIS/ANALYSIS01_SNIPPY/04-snippy/lablog @@ -1,4 +1,4 @@ -# conda activate snippy +# module load singularity scratch_dir=$(echo $PWD | sed 's/\/data\/bi\/scratch_tmp/\/scratch/g') @@ -6,7 +6,7 @@ mkdir logs cat ../samples_id.txt | while read in; do echo -e "${in}\t${scratch_dir}/../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz\t${scratch_dir}/../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz"; done >> input.tab -singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 snippy-multi ${scratch_dir}/input.tab --mincov 9 --mapqual 10 --basequal 5 --minqual 30 --ref ${scratch_dir}/../../../REFERENCES/GCF_015326295.1/GCF_015326295.1_ASM1532629v1_genomic.fna --cpus 5 > commands.out +ls ${scratch_dir}/../../../REFERENCES | xargs -I %% singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 snippy-multi ${scratch_dir}/input.tab --mincov 9 --mapqual 10 --basequal 5 --minqual 30 --ref ${scratch_dir}/../../../REFERENCES/%% --cpus 5 > commands.out head -n -1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/SNIPPY.%j.log --job-name SNIPPY --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 @" | awk '{print $0" &"}' > _00_snippy.sh tail -n 1 commands.out | sed -e "s@^@srun --chdir ${scratch_dir} --output logs/SNIPPY_CORE.%j.log --job-name SNIPPY --cpus-per-task 5 --mem 49152 --partition short_idx --time 02:00:00 env - PATH="$PATH" singularity exec -B ${scratch_dir}/../../../
/data/bi/pipelines/singularity-images/snippy:4.6.0--hdfd78af_4 @" | awk '{print $0" &"}' > _01_snippy_core.sh From 81125321f63d395ae11a344d083daae309a9d244 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 4 Jul 2024 16:23:34 +0200 Subject: [PATCH 093/321] Updated CHANGELOG.md --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 37427a03c..b97d8b2e3 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -51,7 +51,7 @@ Code contributions to the new version: - Added MAG tempalte and removed MAG from other templates [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288) - Added amrfinderplus to characterization template. [#289] (https://github.com/BU-ISCIII/buisciii-tools/pull/289) - Updated all files so that paths referring to /pipelines/ are updated according to the new structure [#287](https://github.com/BU-ISCIII/buisciii-tools/pull/287) -- Updated assembly, ariba, snippy and amrfinderplus templates, removed genomeev and mtbseq_assembly templates and updated services.json [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) +- Updated assembly, ariba, snippy, amrfinderplus and iqtree templates, removed genomeev and mtbseq_assembly templates and updated services.json [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) ### Modules From 130c402013078104fa2a3e6988766fd90798c0c5 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 9 Jul 2024 16:32:09 +0200 Subject: [PATCH 094/321] Updated lablog so that references are directly available in refgenie --- .../viralrecon/ANALYSIS/lablog_viralrecon | 93 ++++++++++++------- 1 file changed, 57 insertions(+), 36 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 3a81fc18a..824278ca3 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -133,7 +133,7 @@ update_nextclade() { echo } -# Checks if fasta and gff references are downloaded. If not, it downloades them (and create family folder if neccesary) +# Checks if fasta and gff references are downloaded. If not, it downloads them (and creates family folder if necessary) check_references() { echo echo_bold "Processing reference: ${ref}." @@ -149,53 +149,74 @@ check_references() { if [ -z $family ]; then family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'ALT="family">.*<' | awk -F 'ALT="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]') fi - echo "Reference $ref organism belongs to $family family." + echo "Reference $ref belongs to $family family." } # Check if FASTA sequence is already downloaded - REF_FASTA=$(find /data/bi/references/virus/ -maxdepth 2 -type f -name "${ref}.fa*" ! -name "*.fai") - if [ -z $REF_FASTA ]; then + obtain_family; + REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) + if echo "$REF_FASTA" | grep -q "Traceback"; then echo "File ${ref}.fasta is not yet downloaded." - obtain_family; if [ -z $family ]; then return; fi - if [ ! -e "/data/bi/references/virus/$family" ]; then # Check if directory doesn't exists - echo "Creating new directory: /data/bi/references/virus/${family}/" - mkdir /data/bi/references/virus/${family}/; chgrp bi /data/bi/references/virus/${family}/ - else - echo "Directory /data/bi/references/virus/${family}/ ALREADY EXISTS." - fi - echo "Downloading ${ref}.fasta file..."
- wget -q -O "/data/bi/references/virus/${family}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" - if [ $? -eq 0 ]; then - REF_FASTA="/data/bi/references/virus/${family}/${ref}.fasta" - chgrp bi $REF_FASTA - echo_green "File ${ref}.fasta downloaded in $REF_FASTA." + if [ -z ${family} ]; then return; fi + if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist + echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." + digest=$(openssl rand -hex 24) + refgenie alias set --aliases ${family} --digest ${digest} -f -c /data/bi/references/refgenie/genome_config.yaml + mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ + wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" + if [ $? -eq 0 ]; then + echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}/." + refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml + else + echo_blinking_red "An error occurred during file downloading." + fi else - echo_blinking_red "An error occurred during file downloading." + echo "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.fasta." + digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml) + mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ + wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" + if [ $? -eq 0 ]; then + echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}/." + refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml + else + echo_blinking_red "An error occurred during file downloading." + fi fi else - echo -e "File ${ref}.fasta is ALREADY available in $REF_FASTA. \xE2\x9C\x85" + echo -e "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85" fi # Check if GFF file is already downloaded - REF_GFF=$(find /data/bi/references/virus/ -maxdepth 2 -type f -name "${ref}.gff*") - if [ -z $REF_GFF ]; then + REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) + if echo "$REF_GFF" | grep -q "Traceback"; then echo "File ${ref}.gff is not yet downloaded." - if [ ! -v family ]; then obtain_family; if [ -z $family ]; then return; fi; fi - if [ ! -e "/data/bi/references/virus/$family" ]; then - echo "Creating new directory: /data/bi/references/virus/${family}/" - mkdir /data/bi/references/virus/${family}/; chgrp bi /data/bi/references/virus/${family}/ - fi - echo "Downloading ${ref}.gff file..." - wget -q -O "/data/bi/references/virus/${family}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" - if [ $? -eq 0 ]; then - REF_GFF="/data/bi/references/virus/${family}/${ref}.gff" - chgrp bi $REF_GFF - echo_green "File ${ref}.gff downloaded in $REF_GFF." - else - echo_blinking_red "An error occurred during file downloading." - fi + if [ ! -v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi + if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist + echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}." + digest=$(openssl rand -hex 24) + refgenie alias set --aliases ${family} --digest ${digest} -f -c /data/bi/references/refgenie/genome_config.yaml + mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ + wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" + if [ $? -eq 0 ]; then + echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/." + refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + else + echo_blinking_red "An error occurred during file downloading." + fi + else + echo "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.gff." + digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml) + mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ + wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" + if [ $? -eq 0 ]; then + echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/." + refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + else + echo_blinking_red "An error occurred during file downloading." + fi + fi else - echo -e "File ${ref}.gff is ALREADY available in $REF_GFF. \xE2\x9C\x85" + echo -e "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85" fi unset family From 852b0111bdca39e1b64cadd1670a587d1b692ff0 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 9 Jul 2024 16:40:56 +0200 Subject: [PATCH 095/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index b97d8b2e3..b1be3e55b 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -52,6 +52,7 @@ Code contributions to the new version: - Added amrfinderplus to characterization template.
[#289] (https://github.com/BU-ISCIII/buisciii-tools/pull/289) - Updated all files so that paths referring to /pipelines/ are updated according to the new structure [#287](https://github.com/BU-ISCIII/buisciii-tools/pull/287) - Updated assembly, ariba, snippy, amrfinderplus and iqtree templates, removed genomeev and mtbseq_assembly templates and updated services.json [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) +- Changed viralrecon's lablog so that references are available within refgenie [#296](https://github.com/BU-ISCIII/buisciii-tools/pull/296) ### Modules From 0d53c4aeef9ecf16e2c70faae1cb7bae8d90a6b6 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Wed, 10 Jul 2024 16:22:06 +0200 Subject: [PATCH 096/321] Fixed minor mistake in the lablog --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 824278ca3..9d523a5ba 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -153,10 +153,10 @@ check_references() { } # Check if FASTA sequence is already downloaded - obtain_family; REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) if echo "$REF_FASTA" | grep -q "Traceback"; then - echo "File ${ref}.fasta is not yet downloaded." + obtain_family; + echo "File ${ref}.fasta is not yet downloaded." if [ -z ${family} ]; then return; fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." From 543c121c7609426b302584259ceec1a887191d5f Mon Sep 17 00:00:00 2001 From: victor5lm Date: Wed, 10 Jul 2024 16:40:02 +0200 Subject: [PATCH 097/321] Moved obtain_family function inside if statement, for speed purposes --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 9d523a5ba..669f1af0d 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -154,10 +154,9 @@ check_references() { # Check if FASTA sequence is already downloaded REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) - if echo "$REF_FASTA" | grep -q "Traceback"; then - obtain_family; - echo "File ${ref}.fasta is not yet downloaded." - if [ -z ${family} ]; then return; fi + if echo "$REF_FASTA" | grep -q "Traceback"; then + echo "File ${ref}.fasta is not yet downloaded." + obtain_family; if [ -z $family ]; then return; fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." 
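[Editor's aside — illustrative, not part of the patches: refgenie resolves a human-readable alias (here, the virus family) to a digest-named directory under data/, which is why the template mints a random digest for a family it has never seen before registering assets against it. Stripped of the error handling, the lookup/register round-trip the lablog builds on is:

    # query the store; prints an absolute path if the asset exists,
    # and a Python traceback (which the script greps for) if it does not
    refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml

    # register a freshly downloaded file kept under data/${digest}/fasta/${ref}/
    refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ \
        --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' \
        -c /data/bi/references/refgenie/genome_config.yaml

Both commands are copied from the surrounding diffs; only the layout of this aside is editorial.]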
digest=$(openssl rand -hex 24) From b6248bd89c59986f4d68012e6de560663fb7cf3d Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 11 Jul 2024 12:44:29 +0200 Subject: [PATCH 098/321] Moved obtain_family function out of the ifstatement, and removed some variables from places where they should not be --- .../viralrecon/ANALYSIS/lablog_viralrecon | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 669f1af0d..8c58a3a98 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -153,10 +153,10 @@ check_references() { } # Check if FASTA sequence is already downloaded + obtain_family; if [ -z $family ]; then return; fi REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) if echo "$REF_FASTA" | grep -q "Traceback"; then echo "File ${ref}.fasta is not yet downloaded." - obtain_family; if [ -z $family ]; then return; fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." digest=$(openssl rand -hex 24) @@ -164,7 +164,7 @@ check_references() { mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then - echo_green "File ${ref}.fasta downloaded in $REF_FASTA." + echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml else echo_blinking_red "An error occurred during file downloading." @@ -175,7 +175,7 @@ check_references() { mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then - echo_green "File ${ref}.fasta downloaded in $REF_FASTA." + echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml else echo_blinking_red "An error occurred during file downloading." @@ -186,10 +186,10 @@ check_references() { fi # Check if GFF file is already downloaded + if [ ! -v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) if echo "$REF_GFF" | grep -q "Traceback"; then - echo "File ${ref}.gff is not yet downloaded." - if [ ! -v ${family} ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi + echo "File ${ref}.gff is not yet downloaded." if [ ! 
-e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}." digest=$(openssl rand -hex 24) @@ -197,7 +197,7 @@ check_references() { mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" if [ $? -eq 0 ]; then - echo_green "File ${ref}.gff downloaded in $REF_GFF." + echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml else echo_blinking_red "An error occurred during file downloading." @@ -208,7 +208,7 @@ check_references() { mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" if [ $? -eq 0 ]; then - echo_green "File ${ref}.gff downloaded in $REF_GFF." + echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml else echo_blinking_red "An error occurred during file downloading." From 84d259687f5bf36d9393e2cae86fe6424a206502 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 22 Jul 2024 17:19:38 +0200 Subject: [PATCH 099/321] Updated services.json with the new bacass version, fixed a refgenie-related issue in viralrecon's lablog, fixed the wrong date grep issue in mtbseq's lablog and updated assembly's config file --- bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config | 2 +- .../mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog | 5 +++-- bu_isciii/templates/services.json | 2 +- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 4 ++++ 4 files changed, 9 insertions(+), 4 deletions(-) diff --git a/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config b/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config index 284208fbb..8325bcd5f 100644 --- a/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config +++ b/bu_isciii/templates/assembly/DOC/hpc_slurm_assembly.config @@ -217,7 +217,7 @@ process { saveAs: { filename -> filename.equals('versions.yml') ? 
null : filename } ] } - withName: 'MULTIQC' { + withName: 'MULTIQC_CUSTOM' { publishDir = [ [ path: { "${params.outdir}/99-stats/multiqc" }, diff --git a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog index d60b322f2..0263c8986 100644 --- a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog +++ b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog @@ -2,6 +2,7 @@ # srun parameters scratch_dir=$(echo $(pwd) | sed "s@/data/bi/scratch_tmp/@/scratch/@g" ) +analysis_year=$(pwd | awk -F'ANALYSIS/' '{print substr($2, 1, 4)}') mkdir logs cat ../samples_id.txt | xargs -I % echo "mkdir %; ln -s ../../01-preprocessing/%/%_R1_filtered.fastq.gz %/%_lib1_R1.fastq.gz" > _00_prepareRaw.sh @@ -12,9 +13,9 @@ cat ../samples_id.txt | xargs -I @@ echo -e "srun --job-name MTBSEQ.@@ --output # classification echo "mkdir classification_all" > _03_gather_results.sh -echo "FIRST_SAMPLE=$( head -n1 ../samples_id.txt ); head -n 1 \${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'2023\" */Classification/Strain_Classification.tab | cut -d \":\" -f 2 >> classification_all/strain_classification_all.tab" >> _03_gather_results.sh +echo "FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n1 ${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'$analysis_year\" */Classification/Strain_Classification.tab | cut -d ":" -f 2 >> classification_all/strain_classification_all.tab" >> _03_gather_results.sh # resistances echo "mkdir resistances_all" >> _03_gather_results.sh cat ../samples_id.txt | xargs -I % echo "cp %/Amend/NONE_joint_cf4_cr4_fr75_ph4_samples1_amended.tab resistances_all/%_var_res.tab" >> _03_gather_results.sh # stats -echo "mkdir stats_all; FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 \$FIRST_SAMPLE/Statistics/Mapping_and_Variant_Statistics.tab > stats_all/statistics_all.tab; grep \"^'2023\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d \":\" -f 2 >> stats_all/statistics_all.tab" >> _03_gather_results.sh +echo "mkdir stats_all; FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 "$FIRST_SAMPLE/Statistics/Mapping_and_Variant_Statistics.tab" > stats_all/statistics_all.tab; grep \"^'$analysis_year\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d ":" -f 2 >> stats_all/statistics_all.tab" >> _03_gather_results.sh diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index 3107c913f..c9e4a108f 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -2,7 +2,7 @@ "assembly_annotation": { "label": "", "template": "assembly", - "url": "https://github.com/Daniel-VM/bacass/tree/buisciii-develop", + "url": "https://github.com/nf-core/bacass/tree/2.3.1", "order": 1, "begin": "", "end": "", diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 8c58a3a98..a98cf487f 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -166,6 +166,7 @@ check_references() { if [ $? 
-eq 0 ]; then echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml + REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml) else echo_blinking_red "An error occurred during file downloading." fi @@ -177,6 +178,7 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml + REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml) else echo_blinking_red "An error occurred during file downloading." fi @@ -199,6 +201,7 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml) else echo_blinking_red "An error occurred during file downloading." fi @@ -210,6 +213,7 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml) else echo_blinking_red "An error occurred during file downloading." 
fi From d894ceee5828eba11572809424472d10fde5d823 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 22 Jul 2024 17:40:50 +0200 Subject: [PATCH 100/321] Removed some extra quotation marks from the mtbseq template --- .../mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog index 0263c8986..bc1c80fa8 100644 --- a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog +++ b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog @@ -12,10 +12,10 @@ cat ../samples_id.txt | xargs -I % echo "cd %;ls *.fastq.gz | tr '_' '\t' | cut cat ../samples_id.txt | xargs -I @@ echo -e "srun --job-name MTBSEQ.@@ --output logs/MTBSEQ.@@.%j.log --partition middle_idx --mem 48G --chdir ${scratch_dir}/@@ --cpus-per-task 10 singularity exec -B ${scratch_dir}/../../../ /data/bi/pipelines/singularity-images/mtbseq:1.0.4--hdfd78af_2 MTBseq --step TBfull --threads 10 --samples samples.txt &" > _02_mtbseq.sh # classification -echo "mkdir classification_all" > _03_gather_results.sh -echo "FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n1 ${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'$analysis_year\" */Classification/Strain_Classification.tab | cut -d ":" -f 2 >> classification_all/strain_classification_all.tab" >> _03_gather_results.sh +echo "mkdir classification_all" > _03_gather_results.sh +echo "FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 ${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'$analysis_year\" */Classification/Strain_Classification.tab | cut -d ":" -f 2 >> classification_all/strain_classification_all.tab" >> _03_gather_results.sh # resistances echo "mkdir resistances_all" >> _03_gather_results.sh cat ../samples_id.txt | xargs -I % echo "cp %/Amend/NONE_joint_cf4_cr4_fr75_ph4_samples1_amended.tab resistances_all/%_var_res.tab" >> _03_gather_results.sh # stats -echo "mkdir stats_all; FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 "$FIRST_SAMPLE/Statistics/Mapping_and_Variant_Statistics.tab" > stats_all/statistics_all.tab; grep \"^'$analysis_year\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d ":" -f 2 >> stats_all/statistics_all.tab" >> _03_gather_results.sh +echo "mkdir stats_all; FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 ${FIRST_SAMPLE}/Statistics/Mapping_and_Variant_Statistics.tab > stats_all/statistics_all.tab; grep \"^'$analysis_year\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d ":" -f 2 >> stats_all/statistics_all.tab" >> _03_gather_results.sh From 5a75ae83d62028d451ae35ab8d4def951a499e42 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 22 Jul 2024 17:42:46 +0200 Subject: [PATCH 101/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index b1be3e55b..d82b79be0 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -53,6 +53,7 @@ Code contributions to the new version: - Updated all files so that paths referring to /pipelines/ are updated according to the new structure [#287](https://github.com/BU-ISCIII/buisciii-tools/pull/287) - Updated assembly, ariba, snippy, amrfinderplus and iqtree templates, removed genomeev and mtbseq_assembly templates and updated services.json 
[#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) - Changed viralrecon's lablog so that references are available within refgenie [#296](https://github.com/BU-ISCIII/buisciii-tools/pull/296) +- Updated services.json, mtbseq's lablog, viralrecon's lablog and assembly's config file [#299](https://github.com/BU-ISCIII/buisciii-tools/pull/299) ### Modules From 913cbb33b2802564f236ec16fd6fbe3b91aa3f94 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Tue, 23 Jul 2024 11:17:41 +0200 Subject: [PATCH 102/321] Added the corresponding \ characters when doing cut --- .../mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog index bc1c80fa8..e5bdac16e 100644 --- a/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog +++ b/bu_isciii/templates/mtbseq/ANALYSIS/ANALYSIS01_MTBSEQ/03-MTBSeq/lablog @@ -13,9 +13,9 @@ cat ../samples_id.txt | xargs -I @@ echo -e "srun --job-name MTBSEQ.@@ --output # classification echo "mkdir classification_all" > _03_gather_results.sh -echo "FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 ${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'$analysis_year\" */Classification/Strain_Classification.tab | cut -d ":" -f 2 >> classification_all/strain_classification_all.tab" >> _03_gather_results.sh +echo "FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 ${FIRST_SAMPLE}/Classification/Strain_Classification.tab > classification_all/strain_classification_all.tab; grep \"^'$analysis_year\" */Classification/Strain_Classification.tab | cut -d \":\" -f 2 >> classification_all/strain_classification_all.tab" >> _03_gather_results.sh # resistances echo "mkdir resistances_all" >> _03_gather_results.sh cat ../samples_id.txt | xargs -I % echo "cp %/Amend/NONE_joint_cf4_cr4_fr75_ph4_samples1_amended.tab resistances_all/%_var_res.tab" >> _03_gather_results.sh # stats -echo "mkdir stats_all; FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 ${FIRST_SAMPLE}/Statistics/Mapping_and_Variant_Statistics.tab > stats_all/statistics_all.tab; grep \"^'$analysis_year\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d ":" -f 2 >> stats_all/statistics_all.tab" >> _03_gather_results.sh +echo "mkdir stats_all; FIRST_SAMPLE=$(head -n1 ../samples_id.txt); head -n 1 ${FIRST_SAMPLE}/Statistics/Mapping_and_Variant_Statistics.tab > stats_all/statistics_all.tab; grep \"^'$analysis_year\" */Statistics/Mapping_and_Variant_Statistics.tab | cut -d \":\" -f 2 >> stats_all/statistics_all.tab" >> _03_gather_results.sh From 75c4f549efd2b43f772aeec871b44ad07955d05b Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 29 Jul 2024 15:42:35 +0200 Subject: [PATCH 103/321] Fixed symlink creation in 99-stats folder (MAG). 
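[Editor's aside — context for this fix, not part of the original commit message: `ln -s TARGET .` names the link after TARGET's basename, so the link is only correct when the source file already carries the sample name. With a made-up sample id, the before/after of the relinking loop that this patch and PATCH 104 converge on looks like:

    ln -s ../x/kraken2_report.txt ./sample1_kraken2_report.txt   # old: fixed source name, link renamed per sample
    ln -s ../x/sample1.kraken2_report.txt .                      # new: per-sample source name, basename reused

]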
--- bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog index 246dae5d4..f3e40c093 100644 --- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog @@ -1,6 +1,6 @@ #module load singularity -cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/kraken2_report.txt ./${in}_kraken2_report.txt; done +cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/${in}kraken2_report.txt .; done scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") From d3385bb2c1f3869fb9333e957a5c3b11ec61c152 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 29 Jul 2024 15:46:55 +0200 Subject: [PATCH 104/321] Added dot --- bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog index f3e40c093..915ddf942 100644 --- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog @@ -1,6 +1,6 @@ #module load singularity -cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/${in}kraken2_report.txt .; done +cat ../../samples_id.txt | while read in; do ln -s ../*_mag/Taxonomy/kraken2/${in}/${in}.kraken2_report.txt .; done scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") From db8306039392e613f538c33a6c16cb8ffe763d91 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 29 Jul 2024 15:55:01 +0200 Subject: [PATCH 105/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index d82b79be0..974e17a77 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -54,6 +54,7 @@ Code contributions to the new version: - Updated assembly, ariba, snippy, amrfinderplus and iqtree templates, removed genomeev and mtbseq_assembly templates and updated services.json [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) - Changed viralrecon's lablog so that references are available within refgenie [#296](https://github.com/BU-ISCIII/buisciii-tools/pull/296) - Updated services.json, mtbseq's lablog, viralrecon's lablog and assembly's config file [#299](https://github.com/BU-ISCIII/buisciii-tools/pull/299) +- Fixed 99-stats (MAG) template. 
[#301](https://github.com/BU-ISCIII/buisciii-tools/pull/301) ### Modules From 8d70a3a7ec37344386eb1dbe2553e7136b80ee1b Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 26 Jul 2024 16:02:09 +0200 Subject: [PATCH 106/321] added emmtyper template --- .../04-emmtyper/lablog | 78 +++++++++++++++++++ 1 file changed, 78 insertions(+) create mode 100644 bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog new file mode 100644 index 000000000..59033b0ec --- /dev/null +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -0,0 +1,78 @@ +#!/bin/sh + +# Create folders +mkdir -p data +mkdir -p .slurm_logs_NC + +# Find all .gz files and write them to a file list +# TODO: add if to check >1 fasta files are available in assembly results +# FIXME: set path to assembly files (tmp: assembly template file path) +find ../../../../assembly/ANALYSIS/*_ASSEMBLY01/results/assembly/unicycler/*.fasta.gz > data/assembly_file_list.txt +ASSEMBLY_LIST=data/assembly_file_list.txt + +# Get the number of files +num_files=$(wc -l < $ASSEMBLY_LIST) + +scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") + +# STEP 1: Set up jobarray to unzip fasta files +cat <<EOF > _00_unzip_jobarray.sbatch +#!/bin/bash +#SBATCH --job-name=unzip_fasta +#SBATCH --ntasks=1 +#SBATCH --cpus-per-task=2 +#SBATCH --mem=8G +#SBATCH --time=2:00:00 +#SBATCH --partition short_idx +#SBATCH --array=1-$num_files +#SBATCH --chdir $scratch_dir +#SBATCH --output .slurm_logs_NC/slurm-%A_%a.out +#SBATCH --error .slurm_logs_NC/slurm-%A_%a.err + +# Get the file to process +file=\$(sed -n "\${SLURM_ARRAY_TASK_ID}p" $ASSEMBLY_LIST) + +# Unzip the file to the destination directory +gzip -dkc \$file > data/\$(basename "\$file" .gz) + +EOF + +# FIXME: symlinks to BLAST DATABASE? +# FIXME: conda & singularity load +# STEP 2: Setup exe file to perform unzip and emmtyper.
+cat <<EOF > _01_emmtyper.sbatch +#!/bin/bash +#SBATCH --job-name emmtyper +#SBATCH --ntasks 1 +#SBATCH --cpus-per-task 4 +#SBATCH --mem 24G +#SBATCH --time 4:00:00 +#SBATCH --partition short_idx +#SBATCH --chdir $scratch_dir +#SBATCH --output ./$(date '+%Y%m%d')_emmtyper.log + +# module load singularity +# conda activate emmtyper-0.2.0 + +# create results folder +mkdir -p 01-typing +mkdir -p 01-typing/tmps + +# Run emmtyper +emmtyper \\ + -w blast \\ + --keep \\ + --blast_db 'path_to_blastdatabase' \\ + --percent-identity 95 \\ + --culling-limit 5 \\ + --output 01-typing/results_emmtyper.out \\ + --output-format verbose \\ + ../data/*.fasta + +mv *.tmp 01-typing/tmps + +EOF + +echo "#!/bin/bash" > _ALLSTEPS_emmtyper.sh +echo "unzip_job_id=\$(sbatch _00_unzip_jobarray.sbatch | awk '{print \$4}')" >> _ALLSTEPS_emmtyper.sh +echo "sbatch --dependency=afterok:\${unzip_job_id} _01_emmtyper.sbatch" >> _ALLSTEPS_emmtyper.sh From f5df419a086a1439c70a7afe0d8ebbfda7b5b720 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 11:22:38 +0200 Subject: [PATCH 107/321] fixing paths and folder names --- .../04-emmtyper/lablog | 15 +++++++-------- 1 file changed, 7 insertions(+), 8 deletions(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog index 59033b0ec..bd6caf0b6 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -1,14 +1,13 @@ #!/bin/sh # Create folders -mkdir -p data +mkdir -p data_NC mkdir -p .slurm_logs_NC # Find all .gz files and write them to a file list # TODO: add if to check >1 fasta files are available in assembly results -# FIXME: set path to assembly files (tmp: assembly template file path) -find ../../../../assembly/ANALYSIS/*_ASSEMBLY01/results/assembly/unicycler/*.fasta.gz > data/assembly_file_list.txt -ASSEMBLY_LIST=data/assembly_file_list.txt +find ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/*.fasta.gz > data_NC/assembly_file_list.txt +ASSEMBLY_LIST=data_NC/assembly_file_list.txt # Get the number of files num_files=$(wc -l < $ASSEMBLY_LIST) @@ -33,11 +32,10 @@ cat <<EOF > _00_unzip_jobarray.sbatch file=\$(sed -n "\${SLURM_ARRAY_TASK_ID}p" $ASSEMBLY_LIST) # Unzip the file to the destination directory -gzip -dkc \$file > data/\$(basename "\$file" .gz) +gzip -dkc \$file > data_NC/\$(basename "\$file" .gz) EOF -# FIXME: symlinks to BLAST DATABASE? # FIXME: conda & singularity load # STEP 2: Setup exe file to perform unzip and emmtyper.
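[Editor's aside — illustrative, not part of the patch: the two heredocs in this template only write sbatch scripts; nothing is submitted until the generated _ALLSTEPS_emmtyper.sh runs. Reduced to plain bash, the chain it sets up is:

    # sbatch prints "Submitted batch job <id>"; awk keeps the id
    unzip_job_id=$(sbatch _00_unzip_jobarray.sbatch | awk '{print $4}')
    # afterok: start emmtyper only once every unzip array task has exited 0
    sbatch --dependency=afterok:${unzip_job_id} _01_emmtyper.sbatch

Both lines mirror the echo'd strings in PATCH 106 with the shell escaping removed.]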
cat <<EOF > _01_emmtyper.sbatch @@ -62,13 +60,14 @@ mkdir -p 01-typing/tmps emmtyper \\ -w blast \\ --keep \\ - --blast_db 'path_to_blastdatabase' \\ + --blast_db '/data/bi/references/cdc_emm_blastdb/cdc_emm_database29042024' \\ --percent-identity 95 \\ --culling-limit 5 \\ --output 01-typing/results_emmtyper.out \\ --output-format verbose \\ - ../data/*.fasta + ./data_NC/*.fasta +mv *emmtyper.log 01-typing/ mv *.tmp 01-typing/tmps EOF From 806cd2c14dab4d12cd899c577e80255aaca8854f Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 11:23:21 +0200 Subject: [PATCH 108/321] add emmtyper to results lablog --- .../RESULTS/lablog_characterization_results | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results index a12cfbd96..a3585ea46 100644 --- a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results +++ b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results @@ -1,6 +1,7 @@ DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega01" mkdir -p "${DELIVERY_FOLDER}/characterization/amrfinderplus" +mkdir -p "${DELIVERY_FOLDER}/characterization/emmtyper" # ARIBA characterization service cd $DELIVERY_FOLDER/characterization @@ -11,4 +12,7 @@ cd amrfinderplus ln -s ../../../../ANALYSIS/*CHARACTERIZATION/*amrfinderplus/*tsv . find .. -xtype l -delete -cd ../.. +cd ../emmtyper +ln -s ../../../../ANALYSIS/*CHARACTERIZATION/*emmtyper/01-typing/results_emmtyper.out . + +cd ../../ From e55bb8d5d83fc8bd5da9630c5e0081c90939d1b2 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 12:11:17 +0200 Subject: [PATCH 109/321] fixed folder name and dir accessing --- .../ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog | 2 +- .../characterization/RESULTS/lablog_characterization_results | 3 ++- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog index bd6caf0b6..735921f9e 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -6,7 +6,7 @@ mkdir -p .slurm_logs_NC # Find all .gz files and write them to a file list # TODO: add if to check >1 fasta files are available in assembly results -find ../../*ANALYSIS*ASSEMBLY/03-assembly/unicycler/*.fasta.gz > data_NC/assembly_file_list.txt +find ../../*ANALYSIS*ASSEMBLY/*-assembly/unicycler/*.fasta.gz > data_NC/assembly_file_list.txt ASSEMBLY_LIST=data_NC/assembly_file_list.txt # Get the number of files diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results index a3585ea46..9d617543a 100644 --- a/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results +++ b/bu_isciii/templates/characterization/RESULTS/lablog_characterization_results @@ -12,7 +12,8 @@ cd amrfinderplus ln -s ../../../../ANALYSIS/*CHARACTERIZATION/*amrfinderplus/*tsv . find .. -xtype l -delete -cd ../emmtyper +cd .. +cd emmtyper ln -s ../../../../ANALYSIS/*CHARACTERIZATION/*emmtyper/01-typing/results_emmtyper.out .
cd ../../ From f55e7bc1874f034efc036659fb6331362d93da0b Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 12:11:43 +0200 Subject: [PATCH 110/321] allow emmtyper to run via singularity --- .../04-emmtyper/lablog | 16 +++++++++++----- 1 file changed, 11 insertions(+), 5 deletions(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog index 735921f9e..7ff21e7a1 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -36,7 +36,6 @@ gzip -dkc \$file > data_NC/\$(basename "\$file" .gz) EOF -# FIXME: conda & singularity load # STEP 2: Setup exe file to perform unzip and emmtyper. cat < _01_emmtyper.sbatch #!/bin/bash @@ -50,28 +49,35 @@ cat < _01_emmtyper.sbatch #SBATCH --output ./$(date '+%Y%m%d')_emmtyper.log # module load singularity -# conda activate emmtyper-0.2.0 # create results folder mkdir -p 01-typing mkdir -p 01-typing/tmps +blastdb_path=/data/bi/references/cdc_emm_blastdb # Run emmtyper -emmtyper \\ +singularity exec \\ + --bind ${scratch_dir} \\ + --bind ${scratch_dir}/../../ \\ + --bind \$blastdb_path \\ + /data/bi/pipelines/singularity-images/singularity-emmtyper.0.2.0--py_0 emmtyper \\ -w blast \\ --keep \\ - --blast_db '/data/bi/references/cdc_emm_blastdb/cdc_emm_database29042024' \\ + --blast_db "${blastdb_path}/cdc_emm_database29042024" \\ --percent-identity 95 \\ --culling-limit 5 \\ --output 01-typing/results_emmtyper.out \\ --output-format verbose \\ ./data_NC/*.fasta -mv *emmtyper.log 01-typing/ mv *.tmp 01-typing/tmps EOF +# Bash script that performs all steps above echo "#!/bin/bash" > _ALLSTEPS_emmtyper.sh +echo "# # module load singularity" >> _ALLSTEPS_emmtyper.sh echo "unzip_job_id=\$(sbatch _00_unzip_jobarray.sbatch | awk '{print \$4}')" >> _ALLSTEPS_emmtyper.sh echo "sbatch --dependency=afterok:\${unzip_job_id} _01_emmtyper.sbatch" >> _ALLSTEPS_emmtyper.sh + +chmod +x _ALLSTEPS_emmtyper.sh From 56262a49a9a3363ace4b73a29bacb53abfc132d4 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 12:25:03 +0200 Subject: [PATCH 111/321] update changelog in #300 --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 974e17a77..8641155ed 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -54,6 +54,7 @@ Code contributions to the new version: - Updated assembly, ariba, snippy, amrfinderplus and iqtree templates, removed genomeev and mtbseq_assembly templates and updated services.json [#295](https://github.com/BU-ISCIII/buisciii-tools/pull/295) - Changed viralrecon's lablog so that references are available within refgenie [#296](https://github.com/BU-ISCIII/buisciii-tools/pull/296) - Updated services.json, mtbseq's lablog, viralrecon's lablog and assembly's config file [#299](https://github.com/BU-ISCIII/buisciii-tools/pull/299) +- Added lablog to automate gene characterization with emmtyper, including unzipping assemblies. [#300](https://github.com/BU-ISCIII/buisciii-tools/pull/300) - Fixed 99-stats (MAG) template. 
[#301](https://github.com/BU-ISCIII/buisciii-tools/pull/301) ### Modules From 78554bb9d8bf89d6f3b6740296b110eac7a2b443 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 13:03:03 +0200 Subject: [PATCH 112/321] added reviewer suggestions in #300 --- .../04-emmtyper/lablog | 16 ++++++++-------- bu_isciii/templates/services.json | 2 +- 2 files changed, 9 insertions(+), 9 deletions(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog index 7ff21e7a1..a2eec9ce0 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -1,13 +1,13 @@ #!/bin/sh # Create folders -mkdir -p data_NC -mkdir -p .slurm_logs_NC +mkdir -p fasta_inputs +mkdir -p slurm_logs # Find all .gz files and write them to a file list # TODO: add if to check >1 fasta files are available in assembly results -find ../../*ANALYSIS*ASSEMBLY/*-assembly/unicycler/*.fasta.gz > data_NC/assembly_file_list.txt -ASSEMBLY_LIST=data_NC/assembly_file_list.txt +find ../../*ANALYSIS*ASSEMBLY/*-assembly/unicycler/*.fasta.gz > fasta_inputs/assembly_file_list.txt +ASSEMBLY_LIST=fasta_inputs/assembly_file_list.txt # Get the number of files num_files=$(wc -l < $ASSEMBLY_LIST) @@ -25,14 +25,14 @@ cat < _00_unzip_jobarray.sbatch #SBATCH --partition short_idx #SBATCH --array=1-$num_files #SBATCH --chdir $scratch_dir -#SBATCH --output .slurm_logs_NC/slurm-%A_%a.out -#SBATCH --error .slurm_logs_NC/slurm-%A_%a.err +#SBATCH --output slurm_logs/slurm-%A_%a.out +#SBATCH --error slurm_logs/slurm-%A_%a.err # Get the file to process file=\$(sed -n "\${SLURM_ARRAY_TASK_ID}p" $ASSEMBLY_LIST) # Unzip the file to the destination directory -gzip -dkc \$file > data_NC/\$(basename "\$file" .gz) +gzip -dkc \$file > fasta_inputs/\$(basename "\$file" .gz) EOF @@ -68,7 +68,7 @@ singularity exec \\ --culling-limit 5 \\ --output 01-typing/results_emmtyper.out \\ --output-format verbose \\ - ./data_NC/*.fasta + ./fasta_inputs/*.fasta mv *.tmp 01-typing/tmps diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index c9e4a108f..3e57d041b 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -198,7 +198,7 @@ "folders":[], "files":[] }, - "no_copy": ["RAW", "TMP", "00-reads"], + "no_copy": ["RAW", "TMP", "00-reads", "fasta_inputs"], "last_folder":"REFERENCES", "delivery_md": "", "results_md": "" From b9f1498ca87dc1b7a933553276b22eb5b3e033aa Mon Sep 17 00:00:00 2001 From: Dani VM Date: Mon, 29 Jul 2024 13:03:40 +0200 Subject: [PATCH 113/321] fix singularity bind --- .../ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog index a2eec9ce0..c93c8fd6c 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -63,7 +63,7 @@ singularity exec \\ /data/bi/pipelines/singularity-images/singularity-emmtyper.0.2.0--py_0 emmtyper \\ -w blast \\ --keep \\ - --blast_db "${blastdb_path}/cdc_emm_database29042024" \\ + --blast_db 
"\${blastdb_path}/cdc_emm_database29042024" \\ --percent-identity 95 \\ --culling-limit 5 \\ --output 01-typing/results_emmtyper.out \\ From 2f7fd5e8ef6eacd4ea9cffffee40ff4c1442439b Mon Sep 17 00:00:00 2001 From: Dani VM Date: Tue, 30 Jul 2024 09:45:11 +0200 Subject: [PATCH 114/321] renamed logs folder --- .../ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog index c93c8fd6c..d5897933c 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS01_CHARACTERIZATION/04-emmtyper/lablog @@ -2,7 +2,7 @@ # Create folders mkdir -p fasta_inputs -mkdir -p slurm_logs +mkdir -p logs # Find all .gz files and write them to a file list # TODO: add if to check >1 fasta files are available in assembly results @@ -25,8 +25,8 @@ cat < _00_unzip_jobarray.sbatch #SBATCH --partition short_idx #SBATCH --array=1-$num_files #SBATCH --chdir $scratch_dir -#SBATCH --output slurm_logs/slurm-%A_%a.out -#SBATCH --error slurm_logs/slurm-%A_%a.err +#SBATCH --output logs/slurm-%A_%a.out +#SBATCH --error logs/slurm-%A_%a.err # Get the file to process file=\$(sed -n "\${SLURM_ARRAY_TASK_ID}p" $ASSEMBLY_LIST) From 309dd28bb244401bb16ed956b402f71e1e76cc35 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 1 Aug 2024 14:46:00 +0200 Subject: [PATCH 115/321] Fixed IRMA's lablog so that the info is not displayed several times neither within the files of each type nor in all_samples_completo.txt --- .../IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) mode change 100755 => 100644 bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog old mode 100755 new mode 100644 index c694a5b91..0e7704fe0 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog @@ -5,12 +5,14 @@ mkdir logs scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") -cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --cpus-per-task 32 --mem 35000M --chdir $scratch_dir --time 01:00:00 --output logs/IRMA.${in}.%j.log /data/bi/pipelines/flu-amd/flu-amd-1.1.4/IRMA FLU_AD ../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${in} --external-config ../../../DOC/irma_config.sh &"; done > _01_irma.sh +cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --cpus-per-task 32 --mem 35000M --chdir $scratch_dir --time 01:00:00 --output logs/IRMA.${in}.%j.log /data/bi/tmp/pipelines_new/flu-amd/flu-amd-1.1.4/IRMA FLU_AD ../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${in} --external-config ../../../DOC/irma_config.sh &"; done > _01_irma.sh echo 'bash create_irma_stats.sh' > _02_create_stats.sh echo "ls */*HA*.fasta | cut -d '/' -f2 | cut -d '.' 
-f1 | sort -u | cut -d '_' -f3 | sed '/^\$/d' | sed 's/^/A_/g' > HA_types.txt" > _03_post_processing.sh +echo 'cat HA_types.txt | while read type; do if test -d ${type}; then rm -rf ${type}; fi; done; if test -d B ; then rm -rf B; fi; if test -d C; then rm -rf C; fi' >> _03_post_processing.sh + echo "cat HA_types.txt | while read in; do mkdir \${in}; done" >> _03_post_processing.sh echo "if grep -qw 'B__' irma_stats.txt; then mkdir B; fi" >> _03_post_processing.sh From 790a728fb1d341624147a7f7b6c48927cd78fd45 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 1 Aug 2024 14:50:58 +0200 Subject: [PATCH 116/321] Substituted pipelines_new by pipelines in line 8 --- .../templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog index 0e7704fe0..e66a50a9d 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog @@ -5,7 +5,7 @@ mkdir logs scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") -cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --cpus-per-task 32 --mem 35000M --chdir $scratch_dir --time 01:00:00 --output logs/IRMA.${in}.%j.log /data/bi/tmp/pipelines_new/flu-amd/flu-amd-1.1.4/IRMA FLU_AD ../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${in} --external-config ../../../DOC/irma_config.sh &"; done > _01_irma.sh +cat ../samples_id.txt | while read in; do echo "srun --partition short_idx --cpus-per-task 32 --mem 35000M --chdir $scratch_dir --time 01:00:00 --output logs/IRMA.${in}.%j.log /data/bi/pipelines/flu-amd/flu-amd-1.1.4/IRMA FLU_AD ../02-preprocessing/${in}/${in}_R1_filtered.fastq.gz ../02-preprocessing/${in}/${in}_R2_filtered.fastq.gz ${in} --external-config ../../../DOC/irma_config.sh &"; done > _01_irma.sh echo 'bash create_irma_stats.sh' > _02_create_stats.sh From 2cf15d9a35a61e8833e1ef6e3e29149f143f1f76 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 1 Aug 2024 14:53:53 +0200 Subject: [PATCH 117/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 8641155ed..6417f4b9b 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -56,6 +56,7 @@ Code contributions to the new version: - Updated services.json, mtbseq's lablog, viralrecon's lablog and assembly's config file [#299](https://github.com/BU-ISCIII/buisciii-tools/pull/299) - Added lablog to automate gene characterization with emmtyper, including unzipping assemblies. [#300](https://github.com/BU-ISCIII/buisciii-tools/pull/300) - Fixed 99-stats (MAG) template. 
[#301](https://github.com/BU-ISCIII/buisciii-tools/pull/301) +- Fixed IRMA's lablog so that the sequences of the samples are not displayed several times neither in the .txt files of each influenza type nor in all_samples_completo.txt [#305](https://github.com/BU-ISCIII/buisciii-tools/pull/305) ### Modules From 8fa9e2a44e09a8fe91e28a4c80b5df1fbfb205bd Mon Sep 17 00:00:00 2001 From: victor5lm Date: Mon, 5 Aug 2024 13:52:13 +0200 Subject: [PATCH 118/321] Added new line to remove all_samples_completo.txt before creating it, in case it already existed previously --- .../templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog | 2 ++ 1 file changed, 2 insertions(+) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog index e66a50a9d..5e9d933b6 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/lablog @@ -13,6 +13,8 @@ echo "ls */*HA*.fasta | cut -d '/' -f2 | cut -d '.' -f1 | sort -u | cut -d '_' - echo 'cat HA_types.txt | while read type; do if test -d ${type}; then rm -rf ${type}; fi; done; if test -d B ; then rm -rf B; fi; if test -d C; then rm -rf C; fi' >> _03_post_processing.sh +echo 'if test -f all_samples_completo.txt; then rm all_samples_completo.txt; fi' >> _03_post_processing.sh + echo "cat HA_types.txt | while read in; do mkdir \${in}; done" >> _03_post_processing.sh echo "if grep -qw 'B__' irma_stats.txt; then mkdir B; fi" >> _03_post_processing.sh From 4620576ce721db3eea3e17b5644a7c34a131b5a8 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Wed, 7 Aug 2024 13:29:10 +0200 Subject: [PATCH 119/321] Modified the email_creation function so that new lines are applied when adding the delivery notes into the body of the email --- bu_isciii/bioinfo_doc.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py index 5583ab8a8..ad7b20a46 100755 --- a/bu_isciii/bioinfo_doc.py +++ b/bu_isciii/bioinfo_doc.py @@ -603,11 +603,11 @@ def email_creation(self): if bu_isciii.utils.prompt_yn_question( f"Do you want to use notes from {self.provided_txt}?", dflt=False ): - email_data["email_notes"] = self.delivery_notes + email_data["email_notes"] = self.delivery_notes.replace("\n", "
") else: email_data["email_notes"] = bu_isciii.utils.ask_for_some_text( msg="Write email notes" - ) + ).replace("\n", "
") email_data["user_data"] = self.resolution_info["service_user_id"] email_data["service_id"] = self.service_name.split("_", 5)[0] From 66da332950059be6e1af1156405582ee58e5095e Mon Sep 17 00:00:00 2001 From: victor5lm Date: Wed, 7 Aug 2024 13:36:39 +0200 Subject: [PATCH 120/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 6417f4b9b..13c20e788 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -57,6 +57,7 @@ Code contributions to the new version: - Added lablog to automate gene characterization with emmtyper, including unzipping assemblies. [#300](https://github.com/BU-ISCIII/buisciii-tools/pull/300) - Fixed 99-stats (MAG) template. [#301](https://github.com/BU-ISCIII/buisciii-tools/pull/301) - Fixed IRMA's lablog so that the sequences of the samples are not displayed several times neither in the .txt files of each influenza type nor in all_samples_completo.txt [#305](https://github.com/BU-ISCIII/buisciii-tools/pull/305) +- Modified bioinfo_doc.py so that new lines in the delivery message are applied in the email [#307](https://github.com/BU-ISCIII/buisciii-tools/pull/307) ### Modules From f209cead765c767b629d483c398197f1390cd479 Mon Sep 17 00:00:00 2001 From: victor5lm Date: Thu, 8 Aug 2024 11:44:22 +0200 Subject: [PATCH 121/321] Ran black --check and black commands so that black_lint does not fail --- bu_isciii/bioinfo_doc.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py index ad7b20a46..37512a40e 100755 --- a/bu_isciii/bioinfo_doc.py +++ b/bu_isciii/bioinfo_doc.py @@ -603,7 +603,9 @@ def email_creation(self): if bu_isciii.utils.prompt_yn_question( f"Do you want to use notes from {self.provided_txt}?", dflt=False ): - email_data["email_notes"] = self.delivery_notes.replace("\n", "
") + email_data["email_notes"] = self.delivery_notes.replace( + "\n", "
" + ) else: email_data["email_notes"] = bu_isciii.utils.ask_for_some_text( msg="Write email notes" From e72dfbc42be47e800c52d348e70428368d1674dd Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Fri, 2 Aug 2024 16:25:18 +0200 Subject: [PATCH 122/321] Added log to pangolin-data update stage. Added check for correct update --- .../viralrecon/ANALYSIS/lablog_viralrecon | 16 ++++++++++------ 1 file changed, 10 insertions(+), 6 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index a98cf487f..6ae5230da 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -16,7 +16,7 @@ The functions performed by the script can be listed as follows: - Checking of the last available version of the Pangolin container. Download if necessary. Database update. File configuration. - Checking the last available version of the Nextclade container. Download if necessary. Extraction of the tag for the analysis dataset. File configuration. -- Checking of required references (fasta and gff) and downloading of from NCBI if necessary. +- Checking if required references (fasta and gff) are locally available and downloading them from NCBI if necessary. - Creation of the necessary directories for the analysis hosts, and subdirectories for each of the references. ' @@ -65,11 +65,15 @@ update_pangolin() { echo -e "Pangolin database is UP TO DATE. \xE2\x9C\x85" else mkdir "$(date '+%Y%m%d')" - srun --partition short_idx singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/ - # log file creation - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tmkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/log - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tsrun --partition short_idx singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/log - echo_green "Pangolin database UPDATED." + echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tmkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/command.log + echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tsrun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/command.log + srun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/ + if [ $? -eq 0 ]; then + echo_green "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" + echo_green "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" + else + echo_blinking_red "Error during pangolin database update." 
+ fi fi cd - From 3f1d9fb197e1c0395b9097a230fc60313afa3c51 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Fri, 2 Aug 2024 16:28:00 +0200 Subject: [PATCH 123/321] Fixed typo --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 6ae5230da..0de45e34a 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -255,7 +255,7 @@ done echo_bold "\nPlease specify the method to be performed." echo_bold "1. Mapping" - echo_bold "2. De novo assemby" + echo_bold "2. De novo assembly" echo_bold "3. Both" while true; do echo -ne "\e[1;38;5;220m"; read -n 1 method; tput sgr0; echo From c3e5dc6817b1feec02a806daf543d12277465a86 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Fri, 2 Aug 2024 16:49:17 +0200 Subject: [PATCH 124/321] Enabled module load singularity inside of the lablog --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 0de45e34a..7ca50950b 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -21,7 +21,7 @@ The functions performed by the script can be listed as follows: ' -# module load singularity +module load singularity # If there is more than 1 reference, please prepare the samples_ref.txt file before running this lablog. From 8675931eeca3a442fd9a34df3555b7c5b1618dca Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 5 Aug 2024 12:15:27 +0200 Subject: [PATCH 125/321] Moved nextclade_dataset_tag and nextclade_dataset_name inside sbatch file instead of PARAMS_FILE --- .../viralrecon/ANALYSIS/lablog_viralrecon | 26 ++++++++++--------- 1 file changed, 14 insertions(+), 12 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 7ca50950b..e6ec4dced 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -128,9 +128,7 @@ update_nextclade() { # Updating params file echo "Updating $PARAMS_FILE file..." sed -i "s|skip_nextclade: true|skip_nextclade: false|" "$PARAMS_FILE" - echo "nextclade_dataset_name: '$virus_tag'" >> $PARAMS_FILE echo "nextclade_dataset: false" >> $PARAMS_FILE - echo "nextclade_dataset_tag: '$nextclade_tag'" >> $PARAMS_FILE echo_bold "File $PARAMS_FILE UPDATED." echo_bold "Finished NEXTCLADE check/update" @@ -348,7 +346,6 @@ else elif [ "$virus_tag" == "rsv" ]; then # Update Nextclade update_nextclade - sed -i '/^nextclade_dataset_name/d' $PARAMS_FILE echo_bold "\nRemember to provide the complete route to primer_bed and primer_fasta files, and specify the nextclade_dataset_name in every sbatch file before running the pipeline."
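[Editor's aside — illustrative, not author text: after this patch the Nextclade choice travels as command-line flags written into each per-reference lablog rather than as params-file keys. The generated pipeline invocation ends up shaped roughly like the sketch below; the run line and the dataset values are made-up placeholders, only the flag names and -resume come from the diff:

    nextflow run viralrecon ... \
        --nextclade_dataset_tag "$nextclade_tag" \
        --nextclade_dataset_name 'rsv_a' \
        -resume

]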
@@ -398,15 +395,20 @@ do echo " --outdir ${ref}_$(date '+%Y%m%d')_viralrecon_mapping \\\\" >> ${FOLDER_NAME}/lablog echo " --fasta ${REF_FASTA} \\\\" >> ${FOLDER_NAME}/lablog echo " --gff ${REF_GFF} \\\\" >> ${FOLDER_NAME}/lablog - if [ "$virus_tag" == 'rsv' ]; then - echo " --primer_bed ../../REFERENCES/XXXX \\\\" >> ${FOLDER_NAME}/lablog - echo " --primer_fasta ../../REFERENCES/XXXX \\\\" >> ${FOLDER_NAME}/lablog - if [ $ref == "EPI_ISL_18668201" ]; then - echo " --nextclade_dataset_name 'rsv_a' \\\\" >> ${FOLDER_NAME}/lablog - elif [ $ref == "EPI_ISL_1653999" ]; then - echo " --nextclade_dataset_name 'rsv_b' \\\\" >> ${FOLDER_NAME}/lablog - else - echo " --nextclade_dataset_name 'rsv_X' \\\\" >> ${FOLDER_NAME}/lablog + if [ -n "$virus_tag" ]; then + echo " --nextclade_dataset_tag '$nextclade_tag' \\\\" >> ${FOLDER_NAME}/lablog + if [ "$virus_tag" == 'rsv' ]; then + echo " --primer_bed ../../REFERENCES/XXXX \\\\" >> ${FOLDER_NAME}/lablog + echo " --primer_fasta ../../REFERENCES/XXXX \\\\" >> ${FOLDER_NAME}/lablog + if [ $ref == "EPI_ISL_18668201" ]; then + echo " --nextclade_dataset_name 'rsv_a' \\\\" >> ${FOLDER_NAME}/lablog + elif [ $ref == "EPI_ISL_1653999" ]; then + echo " --nextclade_dataset_name 'rsv_b' \\\\" >> ${FOLDER_NAME}/lablog + else + echo " --nextclade_dataset_name 'rsv_X' \\\\" >> ${FOLDER_NAME}/lablog + fi + else + echo " --nextclade_dataset_name '$virus_tag' \\\\" >> ${FOLDER_NAME}/lablog fi fi echo " -resume" >> ${FOLDER_NAME}/lablog From 6879896377b2ed55511a49054e60fc80c053750e Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Tue, 6 Aug 2024 09:54:42 +0200 Subject: [PATCH 126/321] Added singularity module load check and screen confirmation messages --- .../templates/viralrecon/ANALYSIS/lablog_viralrecon | 11 ++++++++++- 1 file changed, 10 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index e6ec4dced..4a84b3f15 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -21,7 +21,6 @@ The functions performed by the script can be listed as follows: ' -module load singularity # If there is more than 1 reference, please prepare the samples_ref.txt file before running this lablog. @@ -34,6 +33,16 @@ echo_red() { echo -e "\e[31m$1\e[0m"; } echo_green() { echo -e "\e[32m$1\e[0m"; } echo_blinking_red() { echo -e "\e[1;5;97;5;41m$1\e[0m"; } +# Loading singularity module +module load singularity +singularity_loaded=$(module list | grep singularity | awk '{print $2}') +if [ -n "$singularity_loaded" ]; then + echo_green "$singularity_loaded module succesfully loaded." +else + echo_blinking_red "Singularity module not loaded. Exiting..." + exit 1 +fi + # Updating pangolin. Checks last image available and if is already downloaded. If not, downloads it. This function also updates pangolin database. 
Update related config files with pangolin info
update_pangolin() {

From 5738917285e2c04fa0b5a63363d867a5e78d6da5 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Tue, 6 Aug 2024 10:57:50 +0200
Subject: [PATCH 127/321] Modified name of fasta and gff files (family instead of ref) when using refgenie add function

---
 bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 4a84b3f15..25d958530 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -176,7 +176,7 @@ check_references() {
 wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text"
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}"
- refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml
+ refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${family}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml
 REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml)
 else
 echo_blinking_red "An error occurred during file downloading."
@@ -188,7 +188,7 @@ check_references() {
 wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text"
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}"
- refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${ref}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml
+ refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${family}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml
 REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml)
 else
 echo_blinking_red "An error occurred during file downloading."
@@ -211,7 +211,7 @@ check_references() {
 wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}"
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}"
- refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml
+ refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml
 REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml)
 else
 echo_blinking_red "An error occurred during file downloading."
@@ -223,7 +223,7 @@ check_references() {
 wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}"
 if [ $?
-eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" - refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${ref}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml) else echo_blinking_red "An error occurred during file downloading." From 8e412a7a6b9de884c9464e52821dd8dab6f7cbbc Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Tue, 6 Aug 2024 11:14:59 +0200 Subject: [PATCH 128/321] Updated path for artic SARS primer.bed inside refgenie folder --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 25d958530..400f6220c 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -350,7 +350,7 @@ else update_nextclade update_pangolin - echo "primer_bed: '/data/bi/references/virus/2019-nCoV/amplicons/NC_045512.2/V4.1/artic_v4-1_ncov-2019-primer.scheme.bed'" >> $PARAMS_FILE + echo "primer_bed: '/data/bi/references/refgenie/alias/coronaviridae/primer_schemes/NC_045512.2/artic_v4-1_ncov-2019-primer.scheme.bed'" >> $PARAMS_FILE elif [ "$virus_tag" == "rsv" ]; then # Update Nextclade From 9ad6d573c7203c47461730a836283a8ccde9f5ea Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Tue, 6 Aug 2024 12:30:01 +0200 Subject: [PATCH 129/321] Moved obtain_family function inside if statement, in order to use it just when it is necessary --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 400f6220c..e50efbc49 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -164,10 +164,10 @@ check_references() { } # Check if FASTA sequence is already downloaded - obtain_family; if [ -z $family ]; then return; fi REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) if echo "$REF_FASTA" | grep -q "Traceback"; then echo "File ${ref}.fasta is not yet downloaded." + obtain_family; if [ -z $family ]; then return; fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." digest=$(openssl rand -hex 24) @@ -199,10 +199,10 @@ check_references() { fi # Check if GFF file is already downloaded - if [ ! -v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1) - if echo "$REF_GFF" | grep -q "Traceback"; then - echo "File ${ref}.gff is not yet downloaded." + if echo "$REF_GFF" | grep -q "Traceback"; then + echo "File ${ref}.gff is not yet downloaded." + if [ ! 
-v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi
 if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist
 echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}."
 digest=$(openssl rand -hex 24)

From 74896c3041348b65b9ce2ddf816675a76c306885 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Tue, 6 Aug 2024 13:06:59 +0200
Subject: [PATCH 130/321] Modified the way the references are found. Replaced refgenie seek with awk in references.txt. Added regeneration of references.txt when new references are included

---
 .../viralrecon/ANALYSIS/lablog_viralrecon | 20 +++++++++++--------
 1 file changed, 12 insertions(+), 8 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index e50efbc49..77ab1d0b5 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -164,8 +164,8 @@ check_references() {
 }

 # Check if FASTA sequence is already downloaded
- REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1)
- if echo "$REF_FASTA" | grep -q "Traceback"; then
+ REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt)
+ if [ -z "$REF_FASTA" ]; then
 echo "File ${ref}.fasta is not yet downloaded."
 obtain_family; if [ -z $family ]; then return; fi
 if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists
@@ -177,7 +177,8 @@ check_references() {
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}"
 refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${family}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml
- REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml)
+ bash /data/bi/references/refgenie/alias/ref.sh
+ REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt)
 else
 echo_blinking_red "An error occurred during file downloading."
 fi
@@ -189,7 +190,8 @@ check_references() {
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}"
 refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${family}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml
- REF_FASTA=$(refgenie seek ${family}/fasta.fasta:${ref} -c /data/bi/references/refgenie/genome_config.yaml)
+ bash /data/bi/references/refgenie/alias/ref.sh
+ REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt)
 else
 echo_blinking_red "An error occurred during file downloading."
 fi
@@ -199,8 +201,8 @@ check_references() {
 fi

 # Check if GFF file is already downloaded
- REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml 2>&1)
- if echo "$REF_GFF" | grep -q "Traceback"; then
+ REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt)
+ if [ -z "$REF_GFF" ]; then
 echo "File ${ref}.gff is not yet downloaded."
 if [ !
-v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi
 if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist
@@ -212,7 +214,8 @@ check_references() {
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}"
 refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml
- REF_GFF=$(refgenie seek ${family}/gff.gff:${ref} -c /data/bi/references/refgenie/genome_config.yaml)
+ bash /data/bi/references/refgenie/alias/ref.sh
+ REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt)
 else
 echo_blinking_red "An error occurred during file downloading."
 fi
@@ -224,7 +227,8 @@ check_references() {
 if [ $? -eq 0 ]; then
 echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}"
 refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml
+ bash /data/bi/references/refgenie/alias/ref.sh
+ REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt)
 else
 echo_blinking_red "An error occurred during file downloading."
 fi

From 5a026a25792b10a36c262ee1d2689f1fcb4465fd Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Tue, 6 Aug 2024 13:37:03 +0200
Subject: [PATCH 131/321] Added copy stage for config and params files and added date and time to filenames in order to regenerate these config files when this lablog is run more than once, for several analyses

---
 bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 77ab1d0b5..07946196e 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -242,8 +242,11 @@ check_references() {
 ####################################

 # Setting work variables
-CONFIG_FILE="../DOC/viralrecon.config"
-PARAMS_FILE="../DOC/viralrecon_params.yml"
+timeset=$(date +"%Y-%m-%d_%H-%M-%S")_
+cp ../DOC/viralrecon.config ../DOC/${timeset}_viralrecon.config
+cp ../DOC/viralrecon_params.yml ../DOC/${timeset}_viralrecon_params.yml
+CONFIG_FILE="../DOC/${timeset}_viralrecon.config"
+PARAMS_FILE="../DOC/${timeset}_viralrecon_params.yml"

 # Setting the type of analysis
 echo_bold "\nPlease specify the type of analysis."

From ceb0e062e910ac18b650d03789683d2610b851e7 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Tue, 6 Aug 2024 15:45:07 +0200
Subject: [PATCH 132/321] Replaced refgenie add with refgenie build when including new references.
Added SAMtools module loading --- .../viralrecon/ANALYSIS/lablog_viralrecon | 18 ++++++++++++++---- 1 file changed, 14 insertions(+), 4 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 07946196e..ade96b6b0 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -34,6 +34,7 @@ echo_green() { echo -e "\e[32m$1\e[0m"; } echo_blinking_red() { echo -e "\e[1;5;97;5;41m$1\e[0m"; } # Loading singularity module +module purge module load singularity singularity_loaded=$(module list | grep singularity | awk '{print $2}') if [ -n "$singularity_loaded" ]; then @@ -168,15 +169,24 @@ check_references() { if [ -z "$REF_FASTA" ]; then echo "File ${ref}.fasta is not yet downloaded." obtain_family; if [ -z $family ]; then return; fi + # Loading SAMtools module + module load SAMtools + SAMtools_loaded=$(module list | grep -o 'SAMtools/[0-9.]\+-GCC-[0-9.]\+') + if [ -n "$SAMtools_loaded" ]; then + echo_green "$SAMtools_loaded module succesfully loaded." + else + echo_blinking_red "SAMtools module not loaded. Exiting..." + exit 1 + fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." digest=$(openssl rand -hex 24) - refgenie alias set --aliases ${family} --digest ${digest} -f -c /data/bi/references/refgenie/genome_config.yaml mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" - refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${family}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml + gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta + refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else @@ -189,8 +199,8 @@ check_references() { wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? 
-eq 0 ]; then echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" - refgenie add ${family}/fasta:${ref} --path data/${digest}/fasta/${ref}/ --seek-keys '{"fasta" : "'"${family}.fasta"'"}' -c /data/bi/references/refgenie/genome_config.yaml - bash /data/bi/references/refgenie/alias/ref.sh + gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta + refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else echo_blinking_red "An error occurred during file downloading." From 8115d72a7d300f44311e3681c06c4b565810b2e0 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Tue, 6 Aug 2024 17:15:16 +0200 Subject: [PATCH 133/321] Modified final message. Moved module load singularity stage outside defining functions area --- .../viralrecon/ANALYSIS/lablog_viralrecon | 28 +++++++++++-------- 1 file changed, 16 insertions(+), 12 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index ade96b6b0..d33037a0a 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -33,17 +33,6 @@ echo_red() { echo -e "\e[31m$1\e[0m"; } echo_green() { echo -e "\e[32m$1\e[0m"; } echo_blinking_red() { echo -e "\e[1;5;97;5;41m$1\e[0m"; } -# Loading singularity module -module purge -module load singularity -singularity_loaded=$(module list | grep singularity | awk '{print $2}') -if [ -n "$singularity_loaded" ]; then - echo_green "$singularity_loaded module succesfully loaded." -else - echo_blinking_red "Singularity module not loaded. Exiting..." - exit 1 -fi - # Updating pangolin. Checks last image available and if is already downloaded. If not, downloads it. This function also updates pangolin database. Update related config files with pangolin info update_pangolin() { @@ -251,12 +240,27 @@ check_references() { } #################################### +# Loading singularity module +module purge +module load singularity +singularity_loaded=$(module list | grep singularity | awk '{print $2}') +if [ -n "$singularity_loaded" ]; then + echo_green "$singularity_loaded module succesfully loaded." + echo -e "$(date +'%Y-%m-%d %H:%M:%S')\t${singularity_loaded} module succesfully loaded." >> $(date '+%Y%m%d')/command.log +else + echo_blinking_red "Singularity module not loaded. Exiting..." + exit 1 +fi + # Setting work variables timeset=$(date +"%Y-%m-%d_%H-%M-%S")_ cp ../DOC/viralrecon.config ../DOC/${timeset}_viralrecon.config cp ../DOC/viralrecon_params.yml ../DOC/${timeset}_viralrecon_params.yml CONFIG_FILE="../DOC/${timeset}_viralrecon.config" PARAMS_FILE="../DOC/${timeset}_viralrecon_params.yml" +echo "Created $CONFIG_FILE file." +echo "Created $PARAMS_FILE file." +echo # Setting the type of analysis echo_bold "\nPlease specify the type of analysis." @@ -459,4 +463,4 @@ rm percentajeNs.py rm _02_create_run_percentage_Ns.sh cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd .. -echo_green "\nLablog_viralrecon execution has been completed successfully!" 
+echo_green "\nLablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." From c3188b3750fff10aa1b93f7773ca49eb38189c7d Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Tue, 6 Aug 2024 17:48:27 +0200 Subject: [PATCH 134/321] Created lablog_viralrecon.log --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index d33037a0a..468e8cd6a 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -24,6 +24,9 @@ The functions performed by the script can be listed as follows: # If there is more than 1 reference, please prepare the samples_ref.txt file before running this lablog. +echo "Starting lablog_viralrecon execution." +echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tStarting lablog_viralrecon execution." > lablog_viralrecon.log + #################################### # Defining functions @@ -38,6 +41,7 @@ echo_blinking_red() { echo -e "\e[1;5;97;5;41m$1\e[0m"; } update_pangolin() { echo echo_bold "Starting PANGOLIN check/update." + echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tStarting lablog_viralrecon execution." >> lablog_viralrecon.log echo "Checking Pangolin container version..." url=$(curl -s "https://depot.galaxyproject.org/singularity/") latest_version_pangolin=$(echo "$url" | grep -oP 'pangolin:[^"]+' | sort -V | tail -n 1 | awk -F'>' '{print $1}' | sed 's/<\/a//') @@ -246,7 +250,7 @@ module load singularity singularity_loaded=$(module list | grep singularity | awk '{print $2}') if [ -n "$singularity_loaded" ]; then echo_green "$singularity_loaded module succesfully loaded." - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\t${singularity_loaded} module succesfully loaded." >> $(date '+%Y%m%d')/command.log + echo -e "$(date +'%Y-%m-%d %H:%M:%S')\t${singularity_loaded} module succesfully loaded." >> lablog_viralrecon.log else echo_blinking_red "Singularity module not loaded. Exiting..." exit 1 From a3196c623eaeba3ed1ac31608c1daa1bf9a47d16 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 09:10:05 +0200 Subject: [PATCH 135/321] Added log_message function --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 468e8cd6a..e668e0673 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -30,6 +30,13 @@ echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tStarting lablog_viralrecon execution." 
> #################################### # Defining functions +# Log message saving +log_message() { + local message="$1" + echo "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> ./lablog_viralrecon.log +} + + # Coloring messages echo_bold() { echo -e "\e[1;37m$1\e[0m"; } echo_red() { echo -e "\e[31m$1\e[0m"; } From b7cfcc3670dee256721974c7b7166fcbdf92f5e7 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 09:56:51 +0200 Subject: [PATCH 136/321] Added log_message to every message in the lablog --- .../viralrecon/ANALYSIS/lablog_viralrecon | 155 ++++++++++-------- 1 file changed, 85 insertions(+), 70 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index e668e0673..47b8ebf7e 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -24,8 +24,6 @@ The functions performed by the script can be listed as follows: # If there is more than 1 reference, please prepare the samples_ref.txt file before running this lablog. -echo "Starting lablog_viralrecon execution." -echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tStarting lablog_viralrecon execution." > lablog_viralrecon.log #################################### # Defining functions @@ -33,7 +31,7 @@ echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tStarting lablog_viralrecon execution." > # Log message saving log_message() { local message="$1" - echo "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> ./lablog_viralrecon.log + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> lablog_viralrecon.log } @@ -47,219 +45,233 @@ echo_blinking_red() { echo -e "\e[1;5;97;5;41m$1\e[0m"; } # Updating pangolin. Checks last image available and if is already downloaded. If not, downloads it. This function also updates pangolin database. Update related config files with pangolin info update_pangolin() { echo - echo_bold "Starting PANGOLIN check/update." - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tStarting lablog_viralrecon execution." >> lablog_viralrecon.log - echo "Checking Pangolin container version..." + echo_bold "Starting PANGOLIN check/update."; log_message "Starting PANGOLIN check/update." + echo "Checking Pangolin container version..."; log_message "Checking Pangolin container version..." url=$(curl -s "https://depot.galaxyproject.org/singularity/") latest_version_pangolin=$(echo "$url" | grep -oP 'pangolin:[^"]+' | sort -V | tail -n 1 | awk -F'>' '{print $1}' | sed 's/<\/a//') echo_bold "Latest version available of Pangolin:\e[1;38;5;220m $latest_version_pangolin"; tput sgr0 + log_message "Latest version available of Pangolin: $latest_version_pangolin" - echo "Checking if latest version of Pangolin image is already downloaded..." + echo "Checking if latest version of Pangolin image is already downloaded..."; log_message "Checking if latest version of Pangolin image is already downloaded..." if [ -e "/data/bi/pipelines/singularity-images/$latest_version_pangolin" ]; then - echo "File $latest_version_pangolin already downloaded." - echo -e "Pangolin container is UP TO DATE. \xE2\x9C\x85" + echo "File $latest_version_pangolin already downloaded."; log_message "File $latest_version_pangolin already downloaded." + echo -e "Pangolin container is UP TO DATE. \xE2\x9C\x85"; log_message "Pangolin container is UP TO DATE. \xE2\x9C\x85" else - echo "Downloading $latest_version_pangolin file..." + echo "Downloading $latest_version_pangolin file..."; log_message "Downloading $latest_version_pangolin file..." 
wget -P "/data/bi/pipelines/singularity-images/" "https://depot.galaxyproject.org/singularity/$latest_version_pangolin" if [ $? -eq 0 ]; then - echo_green "$latest_version_pangolin file succesfully downloaded." + echo_green "$latest_version_pangolin file succesfully downloaded."; log_message "$latest_version_pangolin file succesfully downloaded." else - echo_blinking_red "An error occurred during file downloading." + echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi fi # Updating Pangolin database - echo "Setting datadir for Pangolin database." + echo "Setting datadir for Pangolin database."; log_message "Setting datadir for Pangolin database." cd /data/bi/references/pangolin/ if [ -e "./$(date '+%Y%m%d')" ]; then - echo -e "Pangolin database is UP TO DATE. \xE2\x9C\x85" + echo -e "Pangolin database is UP TO DATE. \xE2\x9C\x85"; log_message "Pangolin database is UP TO DATE. \xE2\x9C\x85" else mkdir "$(date '+%Y%m%d')" - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tmkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/command.log - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\tsrun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/command.log + echo -e "$(date +'%Y-%m-%d %H:%M:%S') - mkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/command.log + echo -e "$(date +'%Y-%m-%d %H:%M:%S') - srun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/command.log srun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/ if [ $? -eq 0 ]; then - echo_green "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" - echo_green "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" + echo_green "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" + echo_green "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" else - echo_blinking_red "Error during pangolin database update." + echo_blinking_red "Error during pangolin database update."; log_message "Error during pangolin database update." fi fi cd - # Updating config file - echo "Updating $CONFIG_FILE file..." + echo "Updating $CONFIG_FILE file..."; log_message "Updating $CONFIG_FILE file..." sed -i "s|pangolin:4.3--pyhdfd78af_2|$latest_version_pangolin|" "$CONFIG_FILE" sed -i "s|--datadir XXXX|--datadir $(ls -dt /data/bi/references/pangolin/*/ | head -n 1)|" "$CONFIG_FILE" - echo_bold "File $CONFIG_FILE UPDATED." + echo_bold "File $CONFIG_FILE UPDATED."; log_message "File $CONFIG_FILE UPDATED." # Updating params file - echo "Updating $PARAMS_FILE file..." + echo "Updating $PARAMS_FILE file..."; log_message "Updating $PARAMS_FILE file..." 
sed -i "s|skip_pangolin: true|skip_pangolin: false|" "$PARAMS_FILE" - echo_bold "File $PARAMS_FILE UPDATED." + echo_bold "File $PARAMS_FILE UPDATED."; log_message "File $PARAMS_FILE UPDATED." - echo_bold "Finished PANGOLIN check/update" + echo_bold "Finished PANGOLIN check/update"; log_message "Finished PANGOLIN check/update" echo } # Updating Nextclade. Checks last image available and if is already downloaded. If not, downloads it. Update related config files with nextclade info update_nextclade() { echo - echo_bold "Starting NEXTCLADE check/update." - echo "Checking Nextclade container version..." + echo_bold "Starting NEXTCLADE check/update."; log_message "Starting NEXTCLADE check/update." + echo "Checking Nextclade container version..."; log_message "Checking Nextclade container version..." url=$(curl -s "https://depot.galaxyproject.org/singularity/") latest_version_nextclade=$(echo "$url" | grep -oP 'nextclade:[^"]+' | sort -V | tail -n 1 | awk -F'>' '{print $1}' | sed 's/<\/a//') echo_bold "Latest version available of Nextclade:\e[1;38;5;220m $latest_version_nextclade"; tput sgr0 + log_message "Latest version available of Nextclade: $latest_version_nextclade" - echo "Checking if latest version of Nextclade image is already downloaded..." + echo "Checking if latest version of Nextclade image is already downloaded..."; log_message "Checking if latest version of Nextclade image is already downloaded..." if [ -e "/data/bi/pipelines/singularity-images/$latest_version_nextclade" ]; then - echo "File $latest_version_nextclade already downloaded." - echo -e "Nextclade container is UP TO DATE. \xE2\x9C\x85" + echo "File $latest_version_nextclade already downloaded."; log_message "File $latest_version_nextclade already downloaded." + echo -e "Nextclade container is UP TO DATE. \xE2\x9C\x85"; log_message "Nextclade container is UP TO DATE. \xE2\x9C\x85" else - echo "Downloading $latest_version_nextclade file..." + echo "Downloading $latest_version_nextclade file..."; log_message "Downloading $latest_version_nextclade file..." wget -P "/data/bi/pipelines/singularity-images" "https://depot.galaxyproject.org/singularity/$latest_version_nextclade" if [ $? -eq 0 ]; then - echo_green "$latest_version_nextclade file succesfully downloaded." + echo_green "$latest_version_nextclade file succesfully downloaded."; log_message "$latest_version_nextclade file succesfully downloaded." else - echo_blinking_red "An error occurred during file downloading." + echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi fi # Extracting the current Nextclade data TAG - echo "Extracting Nextclade data TAG..." + echo "Extracting Nextclade data TAG..."; log_message "Extracting Nextclade data TAG..." nextclade_tag=$(singularity run /data/bi/pipelines/singularity-images/$latest_version_nextclade nextclade dataset list --json | grep -zoP "\"path\":\s*\"nextstrain/${virus_tag}[^\"]*\"[\s\S]*?\"tag\":\s*\"\K[^\"]*" | tr '\0' '\n' | head -n 1) echo_bold "Latest \e[1;38;5;220m${virus_tag^^} \e[1;37mNextclade dataset version TAG:\e[1;38;5;220m $nextclade_tag"; tput sgr0 + log_message "Latest ${virus_tag^^} Nextclade dataset version TAG: $nextclade_tag" # Updating config file - echo "Updating $CONFIG_FILE file..." + echo "Updating $CONFIG_FILE file..."; log_message "Updating $CONFIG_FILE file..." sed -i "s|nextclade:3.5.0--h9ee0642_0|$latest_version_nextclade|" "$CONFIG_FILE" - echo_bold "File $CONFIG_FILE UPDATED." 
+ echo_bold "File $CONFIG_FILE UPDATED."; log_message "File $CONFIG_FILE UPDATED." # Updating params file - echo "Updating $PARAMS_FILE file..." + echo "Updating $PARAMS_FILE file..."; log_message "Updating $PARAMS_FILE file..." sed -i "s|skip_nextclade: true|skip_nextclade: false|" "$PARAMS_FILE" echo "nextclade_dataset: false" >> $PARAMS_FILE - echo_bold "File $PARAMS_FILE UPDATED." + echo_bold "File $PARAMS_FILE UPDATED."; log_message "File $PARAMS_FILE UPDATED." - echo_bold "Finished NEXTCLADE check/update" + echo_bold "Finished NEXTCLADE check/update"; log_message "Finished NEXTCLADE check/update" echo } # Checks if fasta and gff references are downloaded. If not, it downloads them (and creates family folder if neccesary) check_references() { echo - echo_bold "Processing reference: ${ref}." + echo_bold "Processing reference: ${ref}."; log_message "Processing reference: ${ref}." # Obtaining family information obtain_family() { organism_id=$(curl -s "https://www.ncbi.nlm.nih.gov/nuccore/${ref}" | grep -o 'ORGANISM=[0-9]\+' | head -n 1 | awk -F '=' '{print $2}') if [ -z $organism_id ]; then - echo_blinking_red "$ref not found in NCBI. Please download it manually." + echo_blinking_red "$ref not found in NCBI. Please download it manually."; log_message "$ref not found in NCBI. Please download it manually." return fi family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'TITLE="family">.*<' | awk -F 'TITLE="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]') if [ -z $family ]; then family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'ALT="family">.*<' | awk -F 'ALT="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]') fi - echo "Reference $ref belongs to $family family." + echo "Reference $ref belongs to $family family."; log_message "Reference $ref belongs to $family family." } # Check if FASTA sequence is already downloaded REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) if [ -z "$REF_FASTA" ]; then - echo "File ${ref}.fasta is not yet downloaded." + echo "File ${ref}.fasta is not yet downloaded."; log_message "File ${ref}.fasta is not yet downloaded." obtain_family; if [ -z $family ]; then return; fi # Loading SAMtools module module load SAMtools SAMtools_loaded=$(module list | grep -o 'SAMtools/[0-9.]\+-GCC-[0-9.]\+') if [ -n "$SAMtools_loaded" ]; then - echo_green "$SAMtools_loaded module succesfully loaded." + echo_green "$SAMtools_loaded module succesfully loaded."; log_message "$SAMtools_loaded module succesfully loaded." else - echo_blinking_red "SAMtools module not loaded. Exiting..." + echo_blinking_red "SAMtools module not loaded. Exiting..."; log_message "SAMtools module not loaded. Exiting..." exit 1 fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." + log_message "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." 
digest=$(openssl rand -hex 24) mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then - echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" + echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." + log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error occurred during file downloading." + echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi else echo "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.fasta." + log_message "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.fasta." digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml) mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then - echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}" + echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." + log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error occurred during file downloading." + echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi fi else - echo -e "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85" + echo -e "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85"; log_message "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85" fi # Check if GFF file is already downloaded REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) if [ -z "$REF_GFF" ]; then - echo "File ${ref}.gff is not yet downloaded." + echo "File ${ref}.gff is not yet downloaded."; log_message "File ${ref}.gff is not yet downloaded." if [ ! -v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi if [ ! 
-e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}." + log_message "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}." digest=$(openssl rand -hex 24) refgenie alias set --aliases ${family} --digest ${digest} -f -c /data/bi/references/refgenie/genome_config.yaml mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" if [ $? -eq 0 ]; then - echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" + echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." + log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error occurred during file downloading." + echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi else echo "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.gff." + log_message "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.gff." digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml) mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" if [ $? -eq 0 ]; then - echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}" + echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." + log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error occurred during file downloading." + echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi fi else - echo -e "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85" + echo -e "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85"; log_message "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85" fi unset family } #################################### + +echo_bold "Starting lablog_viralrecon execution." 
+echo -e "$(date +'%Y-%m-%d %H:%M:%S') - Starting lablog_viralrecon execution." > lablog_viralrecon.log + # Loading singularity module -module purge module load singularity singularity_loaded=$(module list | grep singularity | awk '{print $2}') if [ -n "$singularity_loaded" ]; then echo_green "$singularity_loaded module succesfully loaded." - echo -e "$(date +'%Y-%m-%d %H:%M:%S')\t${singularity_loaded} module succesfully loaded." >> lablog_viralrecon.log + log_message "${singularity_loaded} module succesfully loaded." else echo_blinking_red "Singularity module not loaded. Exiting..." + log_message "Singularity module not loaded. Exiting..." exit 1 fi @@ -269,8 +281,8 @@ cp ../DOC/viralrecon.config ../DOC/${timeset}_viralrecon.config cp ../DOC/viralrecon_params.yml ../DOC/${timeset}_viralrecon_params.yml CONFIG_FILE="../DOC/${timeset}_viralrecon.config" PARAMS_FILE="../DOC/${timeset}_viralrecon_params.yml" -echo "Created $CONFIG_FILE file." -echo "Created $PARAMS_FILE file." +echo "Created $CONFIG_FILE file."; log_message "Created $CONFIG_FILE file." +echo "Created $PARAMS_FILE file."; log_message "Created $PARAMS_FILE file." echo # Setting the type of analysis @@ -281,11 +293,11 @@ while true; do echo -ne "\e[1;38;5;220m"; read -n 1 ANALYSIS_TYPE; tput sgr0; echo if [ "$ANALYSIS_TYPE" == "1" ]; then ANALYSIS_TYPE="METAGENOMIC" - echo_green "$ANALYSIS_TYPE analysis selected." + echo_green "$ANALYSIS_TYPE analysis selected."; log_message "$ANALYSIS_TYPE analysis selected." break elif [ "$ANALYSIS_TYPE" == "2" ]; then ANALYSIS_TYPE="AMPLICONS" - echo_green "$ANALYSIS_TYPE analysis selected." + echo_green "$ANALYSIS_TYPE analysis selected."; log_message "$ANALYSIS_TYPE analysis selected." break else echo_red "Invalid input. Please enter 1 or 2." @@ -299,15 +311,15 @@ echo_bold "\nPlease specify the method to be performed." while true; do echo -ne "\e[1;38;5;220m"; read -n 1 method; tput sgr0; echo if [ "$method" == "1" ]; then - echo_green "Mapping method selected." + echo_green "Mapping method selected."; log_message "Mapping method selected." break elif [ "$method" == "2" ]; then - echo_green "De novo assembly method selected." + echo_green "De novo assembly method selected."; log_message "De novo assembly method selected." sed -i "s|skip_assembly: true|skip_assembly: false|" "$PARAMS_FILE" sed -i "s|skip_variants: false|skip_variants: true|" "$PARAMS_FILE" break elif [ "$method" == "3" ]; then - echo_green "Mapping + de novo assembly methods selected." + echo_green "Mapping + de novo assembly methods selected."; log_message "Mapping + de novo assembly methods selected." sed -i "s|skip_assembly: true|skip_assembly: false|" "$PARAMS_FILE" break else @@ -320,17 +332,17 @@ echo_bold "\nPlease specify the method to be performed." echo read -p $'\e[1;37mIs samples_ref.txt file already prepared? [y/N]: \e[1;38;5;220m' -n 1 samples_ref_prepared; tput sgr0; echo if [ "$samples_ref_prepared" == "y" ]; then - echo -e "File samples_ref.txt READY. \xE2\x9C\x85" + echo -e "File samples_ref.txt READY. \xE2\x9C\x85"; log_message "File samples_ref.txt READY. \xE2\x9C\x85" else : > samples_ref.txt - echo "File samples_ref NOT prepared." + echo "File samples_ref NOT prepared."; log_message "File samples_ref NOT prepared." 
while [ -z "$host" ] || [ -z "$reference" ] || [ "$answer" = "n" ]; do read -p $'\e[1;37mPlease specify the host: \e[1;38;5;220m' host read -p $'\e[1;37mPlease specify the reference: \e[1;38;5;220m' reference read -p $'\e[1;37mAre host [\e[1;38;5;220m'"${host^^}"$'\e[1;37m] and reference [\e[1;38;5;220m'"${reference}"$'\e[1;37m] correct? [Y/n]: \e[1;38;5;220m' -n 1 answer; tput sgr0; echo done while read in; do echo -e "${in}\t${reference}\t${host^^}" >> samples_ref.txt; done < samples_id.txt - echo -e "File samples_ref.txt READY. \xE2\x9C\x85" + echo -e "File samples_ref.txt READY. \xE2\x9C\x85"; log_message "File samples_ref.txt READY. \xE2\x9C\x85. Host: ${host^^}. Reference: ${reference}." fi @@ -361,15 +373,15 @@ else echo -ne "\e[1;38;5;220m"; read -n 1 virus_tag; tput sgr0; echo if [ "$virus_tag" == "1" ]; then virus_tag="sars-cov-2" - echo_green "${virus_tag^^} virus selected." + echo_green "${virus_tag^^} virus selected."; log_message "${virus_tag^^} virus selected." break elif [ "$virus_tag" == "2" ]; then virus_tag="rsv" - echo_green "${virus_tag^^} virus selected." + echo_green "${virus_tag^^} virus selected."; log_message "${virus_tag^^} virus selected." break elif [ "$virus_tag" == "3" ]; then virus_tag="Other" - echo_green "$virus_tag virus selected." + echo_green "$virus_tag virus selected."; log_message "$virus_tag virus selected." break else echo_red "Invalid input. Please select a valid number." @@ -389,10 +401,12 @@ else update_nextclade echo_bold "\nRemember to provide the complete route to primer_bed and primer_fasta files, and specify the nextclade_dataset_name in every sbatch file before running the pipeline." + log_message "Remember to provide the complete route to primer_bed and primer_fasta files, and specify the nextclade_dataset_name in every sbatch file before running the pipeline." else echo "primer_bed: '../REFERENCES/XXXX'" >> $PARAMS_FILE echo_bold "\nRemember to provide the complete route to PRIMER_BED file in $PARAMS_FILE file before running the pipeline." + log_message "Remember to provide the complete route to PRIMER_BED file in $PARAMS_FILE file before running the pipeline." fi fi @@ -475,3 +489,4 @@ rm _02_create_run_percentage_Ns.sh cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd .. echo_green "\nLablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." +log_message "Lablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." 
From 4385ce50d7fa560e0e1e0f323f0bb93b082a1f79 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 10:00:42 +0200 Subject: [PATCH 137/321] Fixed typo --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 47b8ebf7e..7587b64da 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -276,7 +276,7 @@ else fi # Setting work variables -timeset=$(date +"%Y-%m-%d_%H-%M-%S")_ +timeset=$(date +"%Y-%m-%d_%H-%M-%S") cp ../DOC/viralrecon.config ../DOC/${timeset}_viralrecon.config cp ../DOC/viralrecon_params.yml ../DOC/${timeset}_viralrecon_params.yml CONFIG_FILE="../DOC/${timeset}_viralrecon.config" From caf50f31cf64447c61eb7f0d118fae73ad0e6b11 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 13:17:29 +0200 Subject: [PATCH 138/321] Fixed log_message function when used outside service folder (pangolin database update) --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 7587b64da..2f8c29a7b 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -29,9 +29,10 @@ The functions performed by the script can be listed as follows: # Defining functions # Log message saving +current_dir=$PWD log_message() { local message="$1" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> lablog_viralrecon.log + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> $current_dir/lablog_viralrecon.log } From 76581f4784d84294ccd285eb58b9d83d1c4e386c Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 14:01:52 +0200 Subject: [PATCH 139/321] Fixed bug in check_references function --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 1 + 1 file changed, 1 insertion(+) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 2f8c29a7b..1a245b7bc 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -206,6 +206,7 @@ check_references() { log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh + bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." 
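A note on the fix in [PATCH 138/321]: update_pangolin() changes into the pangolin references directory before logging, so a log_message() that appends to a relative lablog_viralrecon.log would silently start writing inside that directory instead of the service folder. Capturing $PWD once at startup pins the log to an absolute path. A minimal sketch of the pitfall and the remedy, with illustrative paths rather than the real service layout:

# Sketch of the relative-path logging pitfall (illustrative paths only).
log_relative() { echo "$1" >> lablog_viralrecon.log; }                  # resolves against $PWD at call time

current_dir=$PWD                                                        # captured once, before any cd
log_absolute() { echo "$1" >> "${current_dir}/lablog_viralrecon.log"; } # always the startup directory

log_relative "message one"    # written to ./lablog_viralrecon.log
cd /tmp                       # like update_pangolin() entering the pangolin references dir
log_relative "message two"    # now written to /tmp/lablog_viralrecon.log, the wrong file
log_absolute "message three"  # still appended to the original log
cd - > /dev/null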
From c86be8204bb33866477c5eee3e85a2420b171e9b Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 14:16:10 +0200 Subject: [PATCH 140/321] Added some messages when building and adding new references --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 1a245b7bc..294dbedfe 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -189,6 +189,7 @@ check_references() { echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta + echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) @@ -205,6 +206,7 @@ check_references() { echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta + echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) @@ -231,6 +233,7 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." + echo "Adding asset for ${ref}.gff file..."; log_message "Building asset for ${ref}.gff file..." refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) @@ -246,6 +249,7 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." + echo "Adding asset for ${ref}.gff file..."; log_message "Building asset for ${ref}.gff file..." 
refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) From b22611af202916761aada880f135e3f3b3bf7e4a Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Wed, 7 Aug 2024 15:51:42 +0200 Subject: [PATCH 141/321] Added srun to refgenie build and refgenie add functions. Created prompt and log messages --- .../viralrecon/ANALYSIS/lablog_viralrecon | 20 +++++++++++++------ 1 file changed, 14 insertions(+), 6 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 294dbedfe..e293974d6 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -190,7 +190,9 @@ check_references() { log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." - refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R + srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R + echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else @@ -207,7 +209,9 @@ check_references() { log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." - refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R bash /data/bi/references/refgenie/alias/ref.sh + srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R + echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else @@ -233,8 +237,10 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." 
log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." - echo "Adding asset for ${ref}.gff file..."; log_message "Building asset for ${ref}.gff file..." - refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + echo "Adding asset for ${ref}.gff file..."; log_message "Adding asset for ${ref}.gff file..." + srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else @@ -249,8 +255,10 @@ check_references() { if [ $? -eq 0 ]; then echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." - echo "Adding asset for ${ref}.gff file..."; log_message "Building asset for ${ref}.gff file..." - refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + echo "Adding asset for ${ref}.gff file..."; log_message "Adding asset for ${ref}.gff file..." + srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml + echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else From 8e846ffd45a2754bad4009746d1771cabdaf4354 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Thu, 8 Aug 2024 13:07:03 +0200 Subject: [PATCH 142/321] Resolved CHANGELOG.md conflict --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 13c20e788..35b6a0478 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -58,6 +58,7 @@ Code contributions to the new version: - Fixed 99-stats (MAG) template. 
[#301](https://github.com/BU-ISCIII/buisciii-tools/pull/301)
- Fixed IRMA's lablog so that the sequences of the samples are not displayed several times neither in the .txt files of each influenza type nor in all_samples_completo.txt [#305](https://github.com/BU-ISCIII/buisciii-tools/pull/305)
- Modified bioinfo_doc.py so that new lines in the delivery message are applied in the email [#307](https://github.com/BU-ISCIII/buisciii-tools/pull/307)
+- Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306)

### Modules

From 1638ad84fca4cfe457120d7ef585f1a17743da74 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 8 Aug 2024 12:55:03 +0200
Subject: [PATCH 143/321] Modified message when pangolin-data is already updated. Added confirmation messages using grep (pangolin and constellations) with logfile inside database folder

---
bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 5 ++++-
1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index e293974d6..bc6d04c1a 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -71,7 +71,10 @@ update_pangolin() {
echo "Setting datadir for Pangolin database."; log_message "Setting datadir for Pangolin database."
cd /data/bi/references/pangolin/
if [ -e "./$(date '+%Y%m%d')" ]; then
- echo -e "Pangolin database is UP TO DATE. \xE2\x9C\x85"; log_message "Pangolin database is UP TO DATE. \xE2\x9C\x85"
+ echo -e "Directory /data/bi/references/pangolin/$(date '+%Y%m%d') already exists. Assuming that a BU-ISCIII member previously updated pangolin database today. \xE2\x9C\x85"
+ log_message "Directory /data/bi/references/pangolin/$(date '+%Y%m%d') already exists. Assuming that a BU-ISCIII member previously updated pangolin database today. \xE2\x9C\x85"
+ echo_green "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"
+ echo_green "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"
else
mkdir "$(date '+%Y%m%d')"
echo -e "$(date +'%Y-%m-%d %H:%M:%S') - mkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/command.log

From 9792924d3f15fa47bf2491122238f5de8b52d371 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Thu, 8 Aug 2024 13:05:25 +0200
Subject: [PATCH 144/321] Added checking stage for proper performance of refgenie build and refgenie add functions

---
.../viralrecon/ANALYSIS/lablog_viralrecon | 52 +++++++++++++------
1 file changed, 36 insertions(+), 16 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index bc6d04c1a..3ee0241de 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -194,10 +194,15 @@ check_references() {
gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta
echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..."
srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R - echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" - log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" - bash /data/bi/references/refgenie/alias/ref.sh - REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + if [ $? -eq 0 ]; then + echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + bash /data/bi/references/refgenie/alias/ref.sh + REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + else + echo_blinking_red "An error ocurred during building asset for ${ref}.fasta file." + log_message "An error ocurred during building asset for ${ref}.fasta file." + fi else echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi @@ -213,10 +218,15 @@ check_references() { gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R - echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" - log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" - bash /data/bi/references/refgenie/alias/ref.sh - REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + if [ $? -eq 0 ]; then + echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + bash /data/bi/references/refgenie/alias/ref.sh + REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + else + echo_blinking_red "An error ocurred during building asset for ${ref}.fasta file." + log_message "An error ocurred during building asset for ${ref}.fasta file." + fi else echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi @@ -242,10 +252,15 @@ check_references() { log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." echo "Adding asset for ${ref}.gff file..."; log_message "Adding asset for ${ref}.gff file..." 
srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml - echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" - log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" - bash /data/bi/references/refgenie/alias/ref.sh - REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + if [ $? -eq 0 ]; then + echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + bash /data/bi/references/refgenie/alias/ref.sh + REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + else + echo_blinking_red "An error ocurred during adding asset for ${ref}.gff file." + log_message "An error ocurred during adding asset for ${ref}.gff file." + fi else echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi @@ -260,10 +275,15 @@ check_references() { log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." echo "Adding asset for ${ref}.gff file..."; log_message "Adding asset for ${ref}.gff file..." srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml - echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" - log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" - bash /data/bi/references/refgenie/alias/ref.sh - REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + if [ $? -eq 0 ]; then + echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + bash /data/bi/references/refgenie/alias/ref.sh + REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) + else + echo_blinking_red "An error ocurred during adding asset for ${ref}.gff file." + log_message "An error ocurred during adding asset for ${ref}.gff file." + fi else echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." fi From b1586df8ae47c959f52c9cae7fd4094eba8511f5 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Thu, 8 Aug 2024 16:36:24 +0200 Subject: [PATCH 145/321] Updated log_message function including prompt message in terminal. 
Removed all duplicated messages --- .../viralrecon/ANALYSIS/lablog_viralrecon | 223 +++++++++--------- 1 file changed, 110 insertions(+), 113 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index 3ee0241de..e705f12de 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -28,11 +28,32 @@ The functions performed by the script can be listed as follows: #################################### # Defining functions -# Log message saving -current_dir=$PWD +# Coloring messages and log saving +logfile=$(echo "$PWD/lablog_viralrecon.log") log_message() { local message="$1" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> $current_dir/lablog_viralrecon.log + case "$2" in + "bold") + echo -e "\e[1;37m$message\e[0m" + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[1;37m$message\e[0m" >> $logfile + ;; + "red") + echo -e "\e[31m$message\e[0m" + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[31m$message\e[0m" >> $logfile + ;; + "green") + echo -e "\e[32m$message\e[0m" + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[32m$message\e[0m" >> $logfile + ;; + "blk_red") + echo -e "\e[1;5;97;5;41m$message\e[0m" + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[1;5;97;5;41m$message\e[0m" >> $logfile + ;; + *) + echo -e "$message" + echo -e "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> $logfile + ;; + esac } @@ -46,250 +67,230 @@ echo_blinking_red() { echo -e "\e[1;5;97;5;41m$1\e[0m"; } # Updating pangolin. Checks last image available and if is already downloaded. If not, downloads it. This function also updates pangolin database. Update related config files with pangolin info update_pangolin() { echo - echo_bold "Starting PANGOLIN check/update."; log_message "Starting PANGOLIN check/update." - echo "Checking Pangolin container version..."; log_message "Checking Pangolin container version..." + log_message "Starting PANGOLIN check/update." bold + log_message "Checking Pangolin container version..." url=$(curl -s "https://depot.galaxyproject.org/singularity/") latest_version_pangolin=$(echo "$url" | grep -oP 'pangolin:[^"]+' | sort -V | tail -n 1 | awk -F'>' '{print $1}' | sed 's/<\/a//') - echo_bold "Latest version available of Pangolin:\e[1;38;5;220m $latest_version_pangolin"; tput sgr0 - log_message "Latest version available of Pangolin: $latest_version_pangolin" + log_message "Latest version available of Pangolin:\e[1;38;5;220m $latest_version_pangolin" bold - echo "Checking if latest version of Pangolin image is already downloaded..."; log_message "Checking if latest version of Pangolin image is already downloaded..." + log_message "Checking if latest version of Pangolin image is already downloaded..." if [ -e "/data/bi/pipelines/singularity-images/$latest_version_pangolin" ]; then - echo "File $latest_version_pangolin already downloaded."; log_message "File $latest_version_pangolin already downloaded." - echo -e "Pangolin container is UP TO DATE. \xE2\x9C\x85"; log_message "Pangolin container is UP TO DATE. \xE2\x9C\x85" + log_message "File $latest_version_pangolin already downloaded." + log_message "Pangolin container is UP TO DATE. \xE2\x9C\x85" else - echo "Downloading $latest_version_pangolin file..."; log_message "Downloading $latest_version_pangolin file..." + log_message "Downloading $latest_version_pangolin file..." 
wget -P "/data/bi/pipelines/singularity-images/" "https://depot.galaxyproject.org/singularity/$latest_version_pangolin" if [ $? -eq 0 ]; then - echo_green "$latest_version_pangolin file succesfully downloaded."; log_message "$latest_version_pangolin file succesfully downloaded." + log_message "$latest_version_pangolin file succesfully downloaded." green else - echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." + log_message "An error occurred during file downloading." blk_red fi fi # Updating Pangolin database - echo "Setting datadir for Pangolin database."; log_message "Setting datadir for Pangolin database." + log_message "Setting datadir for Pangolin database." cd /data/bi/references/pangolin/ if [ -e "./$(date '+%Y%m%d')" ]; then - echo -e "Directory /data/bi/references/pangolin/$(date '+%Y%m%d') already exists. Assuming that a BU-ISCIII member previously updated pangolin database today. \xE2\x9C\x85" log_message "Directory /data/bi/references/pangolin/$(date '+%Y%m%d') already exists. Assuming that a BU-ISCIII member previously updated pangolin database today. \xE2\x9C\x85" - echo_green "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" - echo_green "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" + log_message "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" green + log_message "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" green else mkdir "$(date '+%Y%m%d')" echo -e "$(date +'%Y-%m-%d %H:%M:%S') - mkdir $(date '+%Y%m%d')" >> $(date '+%Y%m%d')/command.log echo -e "$(date +'%Y-%m-%d %H:%M:%S') - srun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/)" >> $(date '+%Y%m%d')/command.log srun --partition short_idx --output ${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log singularity run -B ${PWD} /data/bi/pipelines/singularity-images/$latest_version_pangolin pangolin --update-data --datadir ${PWD}/$(date '+%Y%m%d')/ if [ $? -eq 0 ]; then - echo_green "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" - echo_green "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")"; log_message "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" + log_message "$(grep pangolin "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" green + log_message "$(grep constellations "${PWD}/$(date '+%Y%m%d')/$(date '+%Y%m%d')_pangolin.log")" green else - echo_blinking_red "Error during pangolin database update."; log_message "Error during pangolin database update." + log_message "Error during pangolin database update." blk_red fi fi cd - # Updating config file - echo "Updating $CONFIG_FILE file..."; log_message "Updating $CONFIG_FILE file..." + log_message "Updating $CONFIG_FILE file..." 
sed -i "s|pangolin:4.3--pyhdfd78af_2|$latest_version_pangolin|" "$CONFIG_FILE" sed -i "s|--datadir XXXX|--datadir $(ls -dt /data/bi/references/pangolin/*/ | head -n 1)|" "$CONFIG_FILE" - echo_bold "File $CONFIG_FILE UPDATED."; log_message "File $CONFIG_FILE UPDATED." + log_message "File $CONFIG_FILE UPDATED." # Updating params file - echo "Updating $PARAMS_FILE file..."; log_message "Updating $PARAMS_FILE file..." + log_message "Updating $PARAMS_FILE file..." sed -i "s|skip_pangolin: true|skip_pangolin: false|" "$PARAMS_FILE" - echo_bold "File $PARAMS_FILE UPDATED."; log_message "File $PARAMS_FILE UPDATED." + log_message "File $PARAMS_FILE UPDATED." - echo_bold "Finished PANGOLIN check/update"; log_message "Finished PANGOLIN check/update" + log_message "Finished PANGOLIN check/update" bold echo } # Updating Nextclade. Checks last image available and if is already downloaded. If not, downloads it. Update related config files with nextclade info update_nextclade() { echo - echo_bold "Starting NEXTCLADE check/update."; log_message "Starting NEXTCLADE check/update." - echo "Checking Nextclade container version..."; log_message "Checking Nextclade container version..." + log_message "Starting NEXTCLADE check/update." bold + log_message "Checking Nextclade container version..." url=$(curl -s "https://depot.galaxyproject.org/singularity/") latest_version_nextclade=$(echo "$url" | grep -oP 'nextclade:[^"]+' | sort -V | tail -n 1 | awk -F'>' '{print $1}' | sed 's/<\/a//') - echo_bold "Latest version available of Nextclade:\e[1;38;5;220m $latest_version_nextclade"; tput sgr0 - log_message "Latest version available of Nextclade: $latest_version_nextclade" + log_message "Latest version available of Nextclade:\e[1;38;5;220m $latest_version_nextclade" - echo "Checking if latest version of Nextclade image is already downloaded..."; log_message "Checking if latest version of Nextclade image is already downloaded..." + log_message "Checking if latest version of Nextclade image is already downloaded..." if [ -e "/data/bi/pipelines/singularity-images/$latest_version_nextclade" ]; then - echo "File $latest_version_nextclade already downloaded."; log_message "File $latest_version_nextclade already downloaded." - echo -e "Nextclade container is UP TO DATE. \xE2\x9C\x85"; log_message "Nextclade container is UP TO DATE. \xE2\x9C\x85" + log_message "File $latest_version_nextclade already downloaded." + log_message "Nextclade container is UP TO DATE. \xE2\x9C\x85" else - echo "Downloading $latest_version_nextclade file..."; log_message "Downloading $latest_version_nextclade file..." + log_message "Downloading $latest_version_nextclade file..." wget -P "/data/bi/pipelines/singularity-images" "https://depot.galaxyproject.org/singularity/$latest_version_nextclade" if [ $? -eq 0 ]; then - echo_green "$latest_version_nextclade file succesfully downloaded."; log_message "$latest_version_nextclade file succesfully downloaded." + log_message "$latest_version_nextclade file succesfully downloaded." green else - echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." + log_message "An error occurred during file downloading." blk_red fi fi # Extracting the current Nextclade data TAG - echo "Extracting Nextclade data TAG..."; log_message "Extracting Nextclade data TAG..." + log_message "Extracting Nextclade data TAG..." 
nextclade_tag=$(singularity run /data/bi/pipelines/singularity-images/$latest_version_nextclade nextclade dataset list --json | grep -zoP "\"path\":\s*\"nextstrain/${virus_tag}[^\"]*\"[\s\S]*?\"tag\":\s*\"\K[^\"]*" | tr '\0' '\n' | head -n 1) - echo_bold "Latest \e[1;38;5;220m${virus_tag^^} \e[1;37mNextclade dataset version TAG:\e[1;38;5;220m $nextclade_tag"; tput sgr0 - log_message "Latest ${virus_tag^^} Nextclade dataset version TAG: $nextclade_tag" + log_message "Latest \e[1;38;5;220m${virus_tag^^} \e[1;37mNextclade dataset version TAG:\e[1;38;5;220m $nextclade_tag" bold # Updating config file - echo "Updating $CONFIG_FILE file..."; log_message "Updating $CONFIG_FILE file..." + log_message "Updating $CONFIG_FILE file..." sed -i "s|nextclade:3.5.0--h9ee0642_0|$latest_version_nextclade|" "$CONFIG_FILE" - echo_bold "File $CONFIG_FILE UPDATED."; log_message "File $CONFIG_FILE UPDATED." + log_message "File $CONFIG_FILE UPDATED." # Updating params file - echo "Updating $PARAMS_FILE file..."; log_message "Updating $PARAMS_FILE file..." + log_message "Updating $PARAMS_FILE file..." sed -i "s|skip_nextclade: true|skip_nextclade: false|" "$PARAMS_FILE" echo "nextclade_dataset: false" >> $PARAMS_FILE - echo_bold "File $PARAMS_FILE UPDATED."; log_message "File $PARAMS_FILE UPDATED." + log_message "File $PARAMS_FILE UPDATED." - echo_bold "Finished NEXTCLADE check/update"; log_message "Finished NEXTCLADE check/update" + log_message "Finished NEXTCLADE check/update" bold echo } # Checks if fasta and gff references are downloaded. If not, it downloads them (and creates family folder if neccesary) check_references() { echo - echo_bold "Processing reference: ${ref}."; log_message "Processing reference: ${ref}." + log_message "Processing reference: ${ref}." bold # Obtaining family information obtain_family() { organism_id=$(curl -s "https://www.ncbi.nlm.nih.gov/nuccore/${ref}" | grep -o 'ORGANISM=[0-9]\+' | head -n 1 | awk -F '=' '{print $2}') if [ -z $organism_id ]; then - echo_blinking_red "$ref not found in NCBI. Please download it manually."; log_message "$ref not found in NCBI. Please download it manually." + log_message "$ref not found in NCBI. Please download it manually." blk_red return fi family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'TITLE="family">.*<' | awk -F 'TITLE="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]') if [ -z $family ]; then family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'ALT="family">.*<' | awk -F 'ALT="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]') fi - echo "Reference $ref belongs to $family family."; log_message "Reference $ref belongs to $family family." + log_message "Reference $ref belongs to $family family." } # Check if FASTA sequence is already downloaded REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) if [ -z "$REF_FASTA" ]; then - echo "File ${ref}.fasta is not yet downloaded."; log_message "File ${ref}.fasta is not yet downloaded." + log_message "File ${ref}.fasta is not yet downloaded." obtain_family; if [ -z $family ]; then return; fi # Loading SAMtools module module load SAMtools SAMtools_loaded=$(module list | grep -o 'SAMtools/[0-9.]\+-GCC-[0-9.]\+') if [ -n "$SAMtools_loaded" ]; then - echo_green "$SAMtools_loaded module succesfully loaded."; log_message "$SAMtools_loaded module succesfully loaded." 
+ log_message "$SAMtools_loaded module succesfully loaded." green else - echo_blinking_red "SAMtools module not loaded. Exiting..."; log_message "SAMtools module not loaded. Exiting..." + log_message "SAMtools module not loaded. Exiting..." blk_red exit 1 fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exists - echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." log_message "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}." digest=$(openssl rand -hex 24) mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then - echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." - log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." + log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." green gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta - echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." + log_message "Building asset for ${ref}.fasta file..." srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R if [ $? -eq 0 ]; then - echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" - log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error ocurred during building asset for ${ref}.fasta file." - log_message "An error ocurred during building asset for ${ref}.fasta file." + log_message "An error ocurred during building asset for ${ref}.fasta file." blk_red fi else - echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." + log_message "An error occurred during file downloading." blk_red fi else - echo "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.fasta." log_message "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.fasta." digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml) mkdir -p /data/bi/references/refgenie/data/${digest}/fasta/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta" "https://eutils.ncbi.nlm.nih.gov/entrez/eutils/efetch.fcgi?db=nuccore&id=${ref}&rettype=fasta&retmode=text" if [ $? -eq 0 ]; then - echo_green "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." 
- log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." + log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." green gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta - echo "Building asset for ${ref}.fasta file..."; log_message "Building asset for ${ref}.fasta file..." + log_message "Building asset for ${ref}.fasta file..." srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R if [ $? -eq 0 ]; then - echo_bold "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" - log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" + log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error ocurred during building asset for ${ref}.fasta file." - log_message "An error ocurred during building asset for ${ref}.fasta file." + log_message "An error ocurred during building asset for ${ref}.fasta file." blk_red fi else - echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." + log_message "An error occurred during file downloading." blk_red fi fi else - echo -e "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85"; log_message "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85" + log_message "File ${ref}.fasta is ALREADY available in $(dirname $REF_FASTA). \xE2\x9C\x85" fi # Check if GFF file is already downloaded REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) if [ -z "$REF_GFF" ]; then - echo "File ${ref}.gff is not yet downloaded."; log_message "File ${ref}.gff is not yet downloaded." + log_message "File ${ref}.gff is not yet downloaded." if [ ! -v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist - echo "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}." log_message "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}." digest=$(openssl rand -hex 24) refgenie alias set --aliases ${family} --digest ${digest} -f -c /data/bi/references/refgenie/genome_config.yaml mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" if [ $? -eq 0 ]; then - echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." - log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." 
- echo "Adding asset for ${ref}.gff file..."; log_message "Adding asset for ${ref}.gff file..." + log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." green + log_message "Adding asset for ${ref}.gff file..." srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml if [ $? -eq 0 ]; then - echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" - log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error ocurred during adding asset for ${ref}.gff file." - log_message "An error ocurred during adding asset for ${ref}.gff file." + log_message "An error ocurred during adding asset for ${ref}.gff file." blk_red fi else - echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." + log_message "An error occurred during file downloading." blk_red fi else - echo "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.gff." log_message "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.gff." digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml) mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}" if [ $? -eq 0 ]; then - echo_green "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." - log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." - echo "Adding asset for ${ref}.gff file..."; log_message "Adding asset for ${ref}.gff file..." + log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." green + log_message "Adding asset for ${ref}.gff file..." srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml if [ $? -eq 0 ]; then - echo_bold "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" - log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" + log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) else - echo_blinking_red "An error ocurred during adding asset for ${ref}.gff file." - log_message "An error ocurred during adding asset for ${ref}.gff file." + log_message "An error ocurred during adding asset for ${ref}.gff file." 
blk_red fi else - echo_blinking_red "An error occurred during file downloading."; log_message "An error occurred during file downloading." + log_message "An error occurred during file downloading." blk_red fi fi else - echo -e "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85"; log_message "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85" + log_message "File ${ref}.gff is ALREADY available in $(dirname $REF_GFF). \xE2\x9C\x85" fi unset family @@ -297,18 +298,16 @@ check_references() { #################################### -echo_bold "Starting lablog_viralrecon execution." -echo -e "$(date +'%Y-%m-%d %H:%M:%S') - Starting lablog_viralrecon execution." > lablog_viralrecon.log +echo -e "\e[1;37mStarting lablog_viralrecon execution.\e[0m" +echo -e "$(date +'%Y-%m-%d %H:%M:%S') - \e[1;37mStarting lablog_viralrecon execution.\e[0m" > $logfile # Loading singularity module module load singularity singularity_loaded=$(module list | grep singularity | awk '{print $2}') if [ -n "$singularity_loaded" ]; then - echo_green "$singularity_loaded module succesfully loaded." - log_message "${singularity_loaded} module succesfully loaded." + log_message "${singularity_loaded} module succesfully loaded." green else - echo_blinking_red "Singularity module not loaded. Exiting..." - log_message "Singularity module not loaded. Exiting..." + log_message "Singularity module not loaded. Exiting..." blk_red exit 1 fi @@ -318,8 +317,8 @@ cp ../DOC/viralrecon.config ../DOC/${timeset}_viralrecon.config cp ../DOC/viralrecon_params.yml ../DOC/${timeset}_viralrecon_params.yml CONFIG_FILE="../DOC/${timeset}_viralrecon.config" PARAMS_FILE="../DOC/${timeset}_viralrecon_params.yml" -echo "Created $CONFIG_FILE file."; log_message "Created $CONFIG_FILE file." -echo "Created $PARAMS_FILE file."; log_message "Created $PARAMS_FILE file." +log_message "Created $CONFIG_FILE file." +log_message "Created $PARAMS_FILE file." echo # Setting the type of analysis @@ -330,11 +329,11 @@ while true; do echo -ne "\e[1;38;5;220m"; read -n 1 ANALYSIS_TYPE; tput sgr0; echo if [ "$ANALYSIS_TYPE" == "1" ]; then ANALYSIS_TYPE="METAGENOMIC" - echo_green "$ANALYSIS_TYPE analysis selected."; log_message "$ANALYSIS_TYPE analysis selected." + log_message "$ANALYSIS_TYPE analysis selected." green break elif [ "$ANALYSIS_TYPE" == "2" ]; then ANALYSIS_TYPE="AMPLICONS" - echo_green "$ANALYSIS_TYPE analysis selected."; log_message "$ANALYSIS_TYPE analysis selected." + log_message "$ANALYSIS_TYPE analysis selected." green break else echo_red "Invalid input. Please enter 1 or 2." @@ -348,15 +347,15 @@ echo_bold "\nPlease specify the method to be performed." while true; do echo -ne "\e[1;38;5;220m"; read -n 1 method; tput sgr0; echo if [ "$method" == "1" ]; then - echo_green "Mapping method selected."; log_message "Mapping method selected." + log_message "Mapping method selected." green break elif [ "$method" == "2" ]; then - echo_green "De novo assembly method selected."; log_message "De novo assembly method selected." + log_message "De novo assembly method selected." green sed -i "s|skip_assembly: true|skip_assembly: false|" "$PARAMS_FILE" sed -i "s|skip_variants: false|skip_variants: true|" "$PARAMS_FILE" break elif [ "$method" == "3" ]; then - echo_green "Mapping + de novo assembly methods selected."; log_message "Mapping + de novo assembly methods selected." + log_message "Mapping + de novo assembly methods selected." 
green sed -i "s|skip_assembly: true|skip_assembly: false|" "$PARAMS_FILE" break else @@ -369,17 +368,17 @@ echo_bold "\nPlease specify the method to be performed." echo read -p $'\e[1;37mIs samples_ref.txt file already prepared? [y/N]: \e[1;38;5;220m' -n 1 samples_ref_prepared; tput sgr0; echo if [ "$samples_ref_prepared" == "y" ]; then - echo -e "File samples_ref.txt READY. \xE2\x9C\x85"; log_message "File samples_ref.txt READY. \xE2\x9C\x85" + log_message "File samples_ref.txt READY. \xE2\x9C\x85" else : > samples_ref.txt - echo "File samples_ref NOT prepared."; log_message "File samples_ref NOT prepared." + log_message "File samples_ref NOT prepared." while [ -z "$host" ] || [ -z "$reference" ] || [ "$answer" = "n" ]; do read -p $'\e[1;37mPlease specify the host: \e[1;38;5;220m' host read -p $'\e[1;37mPlease specify the reference: \e[1;38;5;220m' reference read -p $'\e[1;37mAre host [\e[1;38;5;220m'"${host^^}"$'\e[1;37m] and reference [\e[1;38;5;220m'"${reference}"$'\e[1;37m] correct? [Y/n]: \e[1;38;5;220m' -n 1 answer; tput sgr0; echo done while read in; do echo -e "${in}\t${reference}\t${host^^}" >> samples_ref.txt; done < samples_id.txt - echo -e "File samples_ref.txt READY. \xE2\x9C\x85"; log_message "File samples_ref.txt READY. \xE2\x9C\x85. Host: ${host^^}. Reference: ${reference}." + log_message "File samples_ref.txt READY. \xE2\x9C\x85. Host: ${host^^}. Reference: ${reference}." fi @@ -391,6 +390,7 @@ if [ "$ANALYSIS_TYPE" = "METAGENOMIC" ]; then read -p $'\e[1;37mDo the sequences correspond to monkeypox virus (MPV)? [y/N]: \e[1;38;5;220m' -n 1 monkeypox; tput sgr0; echo if [ "$monkeypox" == "y" ]; then + log_message "Monkeypox virus (MPV) analisys selected" virus_tag='mpox' # Update Nextclade update_nextclade @@ -410,15 +410,15 @@ else echo -ne "\e[1;38;5;220m"; read -n 1 virus_tag; tput sgr0; echo if [ "$virus_tag" == "1" ]; then virus_tag="sars-cov-2" - echo_green "${virus_tag^^} virus selected."; log_message "${virus_tag^^} virus selected." + log_message "${virus_tag^^} virus selected." green break elif [ "$virus_tag" == "2" ]; then virus_tag="rsv" - echo_green "${virus_tag^^} virus selected."; log_message "${virus_tag^^} virus selected." + log_message "${virus_tag^^} virus selected." green break elif [ "$virus_tag" == "3" ]; then virus_tag="Other" - echo_green "$virus_tag virus selected."; log_message "$virus_tag virus selected." + log_message "$virus_tag virus selected." green break else echo_red "Invalid input. Please select a valid number." @@ -437,13 +437,11 @@ else # Update Nextclade update_nextclade - echo_bold "\nRemember to provide the complete route to primer_bed and primer_fasta files, and specify the nextclade_dataset_name in every sbatch file before running the pipeline." - log_message "Remember to provide the complete route to primer_bed and primer_fasta files, and specify the nextclade_dataset_name in every sbatch file before running the pipeline." + log_message "Remember to provide the complete route to primer_bed and primer_fasta files, and specify the nextclade_dataset_name in every sbatch file before running the pipeline." bold else echo "primer_bed: '../REFERENCES/XXXX'" >> $PARAMS_FILE - echo_bold "\nRemember to provide the complete route to PRIMER_BED file in $PARAMS_FILE file before running the pipeline." - log_message "Remember to provide the complete route to PRIMER_BED file in $PARAMS_FILE file before running the pipeline." + log_message "Remember to provide the complete route to PRIMER_BED file in $PARAMS_FILE file before running the pipeline." 
bold fi fi @@ -525,5 +523,4 @@ rm percentajeNs.py rm _02_create_run_percentage_Ns.sh cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd .. -echo_green "\nLablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." -log_message "Lablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." +log_message "Lablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." green From cbd7183dd9b50c4690002c090a7f374965f0fced Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Thu, 8 Aug 2024 16:41:33 +0200 Subject: [PATCH 146/321] Fixed bug --- bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index e705f12de..b31243c2e 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -130,7 +130,7 @@ update_nextclade() { log_message "Checking Nextclade container version..." url=$(curl -s "https://depot.galaxyproject.org/singularity/") latest_version_nextclade=$(echo "$url" | grep -oP 'nextclade:[^"]+' | sort -V | tail -n 1 | awk -F'>' '{print $1}' | sed 's/<\/a//') - log_message "Latest version available of Nextclade:\e[1;38;5;220m $latest_version_nextclade" + log_message "Latest version available of Nextclade:\e[1;38;5;220m $latest_version_nextclade" bold log_message "Checking if latest version of Nextclade image is already downloaded..." 
if [ -e "/data/bi/pipelines/singularity-images/$latest_version_nextclade" ]; then From 63f69d771fe772785bcc4e57e302a5e2f8066302 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Fri, 9 Aug 2024 11:29:40 +0200 Subject: [PATCH 147/321] Added timestamp variable to log_message function --- .../viralrecon/ANALYSIS/lablog_viralrecon | 20 +++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon index b31243c2e..02c5b055a 100644 --- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon +++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon @@ -30,28 +30,29 @@ The functions performed by the script can be listed as follows: # Coloring messages and log saving logfile=$(echo "$PWD/lablog_viralrecon.log") +timestamp=$(date +"%Y-%m-%d_%H-%M-%S") log_message() { local message="$1" case "$2" in "bold") echo -e "\e[1;37m$message\e[0m" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[1;37m$message\e[0m" >> $logfile + echo -e "$timestamp - \e[1;37m$message\e[0m" >> $logfile ;; "red") echo -e "\e[31m$message\e[0m" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[31m$message\e[0m" >> $logfile + echo -e "$timestamp - \e[31m$message\e[0m" >> $logfile ;; "green") echo -e "\e[32m$message\e[0m" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[32m$message\e[0m" >> $logfile + echo -e "$timestamp - \e[32m$message\e[0m" >> $logfile ;; "blk_red") echo -e "\e[1;5;97;5;41m$message\e[0m" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - \e[1;5;97;5;41m$message\e[0m" >> $logfile + echo -e "$timestamp - \e[1;5;97;5;41m$message\e[0m" >> $logfile ;; *) echo -e "$message" - echo -e "$(date '+%Y-%m-%d %H:%M:%S') - $message" >> $logfile + echo -e "$timestamp - $message" >> $logfile ;; esac } @@ -312,11 +313,10 @@ else fi # Setting work variables -timeset=$(date +"%Y-%m-%d_%H-%M-%S") -cp ../DOC/viralrecon.config ../DOC/${timeset}_viralrecon.config -cp ../DOC/viralrecon_params.yml ../DOC/${timeset}_viralrecon_params.yml -CONFIG_FILE="../DOC/${timeset}_viralrecon.config" -PARAMS_FILE="../DOC/${timeset}_viralrecon_params.yml" +cp ../DOC/viralrecon.config ../DOC/${timestamp}_viralrecon.config +cp ../DOC/viralrecon_params.yml ../DOC/${timestamp}_viralrecon_params.yml +CONFIG_FILE="../DOC/${timestamp}_viralrecon.config" +PARAMS_FILE="../DOC/${timestamp}_viralrecon_params.yml" log_message "Created $CONFIG_FILE file." log_message "Created $PARAMS_FILE file." echo From dbf8de4412f7edc3f22d704407d17650fb31d000 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Fri, 9 Aug 2024 14:54:52 +0200 Subject: [PATCH 148/321] Fixed bug. 
Now, references with no family are assigned to miscellaneous

---
bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 5 +++++
1 file changed, 5 insertions(+)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 02c5b055a..3537bd36b 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -182,6 +182,11 @@ check_references() {
family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'TITLE="family">.*<' | awk -F 'TITLE="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]')
if [ -z $family ]; then
family=$(curl -s "https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?id=${organism_id}" | grep -o 'ALT="family">.*<' | awk -F 'ALT="family">' '{print $2}' | cut -d '<' -f 1 | tr '[:upper:]' '[:lower:]')
+ if [ -z $family ]; then
+ family="miscellanous"
+ log_message "Reference $ref does not currently belong to any family. Assigned to $family."
+ break
+ fi
fi
log_message "Reference $ref belongs to $family family."
}

From e1c81495f8a0775caef796dd6d86ab45af8351c9 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Fri, 9 Aug 2024 14:57:47 +0200
Subject: [PATCH 149/321] Replaced break with return

---
bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 3537bd36b..727a308bd 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -185,7 +185,7 @@ check_references() {
if [ -z $family ]; then
family="miscellanous"
log_message "Reference $ref does not currently belong to any family. Assigned to $family."
- break
+ return
fi
fi
log_message "Reference $ref belongs to $family family."

From 43fc68e9e5288b1a089846e1567f0bc2802685f8 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Tue, 13 Aug 2024 15:42:26 +0200
Subject: [PATCH 150/321] Changed color of last message

---
bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 727a308bd..12d6c6670 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -528,4 +528,4 @@
rm percentajeNs.py
rm _02_create_run_percentage_Ns.sh
cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd ..
-log_message "Lablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." green
+log_message "Lablog_viralrecon execution has been completed. Please verify all the configurations are set up correctly." bold

From 2b08b9c0f54c9150bf3c8dc1d7f4590cea774665 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 14 Aug 2024 15:49:51 +0200
Subject: [PATCH 151/321] Modified name of gff file (now named after the family)

---
bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 12d6c6670..ff8cdea2e 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -260,7 +260,7 @@ check_references() {
digest=$(openssl rand -hex 24)
refgenie alias set --aliases ${family} --digest ${digest} -f -c /data/bi/references/refgenie/genome_config.yaml
mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/
- wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}"
+ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${family}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}"
if [ $? -eq 0 ]; then
log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." green
log_message "Adding asset for ${ref}.gff file..."
@@ -279,7 +279,7 @@ check_references() {
log_message "Directory /data/bi/references/refgenie/alias/${family}/ ALREADY EXISTS. Downloading ${ref}.gff."
digest=$(refgenie alias get -a ${family} -c /data/bi/references/refgenie/genome_config.yaml)
mkdir -p /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/
- wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${ref}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}"
+ wget -q -O "/data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}/${family}.gff" "https://www.ncbi.nlm.nih.gov/sviewer/viewer.cgi?db=nuccore&report=gff3&id=${ref}"
if [ $? -eq 0 ]; then
log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." green
log_message "Adding asset for ${ref}.gff file..."

From b75d1c18b7e4f2f7814e259c9cf07af5043c89fe Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Wed, 14 Aug 2024 16:03:01 +0200
Subject: [PATCH 152/321] Removed srun from refgenie build and refgenie add in order to avoid wrong behaviour of the loop at line 471.

---
.../viralrecon/ANALYSIS/lablog_viralrecon | 16 ++++++++--------
1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index ff8cdea2e..6477bd408 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -214,8 +214,8 @@ check_references() {
log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." green
gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta
log_message "Building asset for ${ref}.fasta file..."
- srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R
- if [ $?
-eq 0 ]; then + refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R > ${ref}.fasta_build.log 2>&1 + if grep -q "Created" "${ref}.fasta_build.log"; then log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) @@ -234,8 +234,8 @@ check_references() { log_message "File ${ref}.fasta downloaded in /data/bi/references/refgenie/data/${digest}/fasta/${ref}." green gzip /data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta log_message "Building asset for ${ref}.fasta file..." - srun --partition short_idx --output ${ref}.fasta_build.log refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R - if [ $? -eq 0 ]; then + refgenie build ${family}/fasta:${ref} --files fasta=/data/bi/references/refgenie/data/${digest}/fasta/${ref}/${ref}.fasta.gz -c /data/bi/references/refgenie/genome_config.yaml -R > ${ref}.fasta_build.log 2>&1 + if grep -q "Created" "${ref}.fasta_build.log"; then log_message "$(grep Created ${ref}.fasta_build.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.fasta_build.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_FASTA=$(awk -v ref="$ref" '$0 ~ ref && /fasta/ {print $4}' /data/bi/references/refgenie/alias/references.txt) @@ -264,8 +264,8 @@ check_references() { if [ $? -eq 0 ]; then log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." green log_message "Adding asset for ${ref}.gff file..." - srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml - if [ $? -eq 0 ]; then + refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml > ${ref}.gff_add.log 2>&1 + if grep -q "Created" "${ref}.gff_add.log"; then log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" bold bash /data/bi/references/refgenie/alias/ref.sh REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt) @@ -283,8 +283,8 @@ check_references() { if [ $? -eq 0 ]; then log_message "File ${ref}.gff downloaded in /data/bi/references/refgenie/data/${digest}/ensembl_rb/${ref}." green log_message "Adding asset for ${ref}.gff file..." - srun --partition short_idx --output ${ref}.gff_add.log refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml - if [ $? 
-eq 0 ]; then
+            refgenie add ${family}/gff:${ref} --path data/${digest}/ensembl_rb/${ref}/ --seek-keys '{"gff" : "'"${family}.gff"'"}' -c /data/bi/references/refgenie/genome_config.yaml > ${ref}.gff_add.log 2>&1
+            if grep -q "Created" "${ref}.gff_add.log"; then
                 log_message "$(grep Created ${ref}.gff_add.log) $(grep "/data/bi/references/refgenie/alias/" ${ref}.gff_add.log)" bold
                 bash /data/bi/references/refgenie/alias/ref.sh
                 REF_GFF=$(awk -v ref="$ref" '$0 ~ ref && /gff/ {print $4}' /data/bi/references/refgenie/alias/references.txt)

From 003a2267b2d244a648f11f86b24829cd5a2aedf1 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Fri, 16 Aug 2024 10:41:23 +0200
Subject: [PATCH 153/321] Added loading stage for micromamba refgenie environment

---
 .../viralrecon/ANALYSIS/lablog_viralrecon | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
index 6477bd408..ec944be38 100644
--- a/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
+++ b/bu_isciii/templates/viralrecon/ANALYSIS/lablog_viralrecon
@@ -205,6 +205,15 @@ check_references() {
         log_message "SAMtools module not loaded. Exiting..." blk_red
         exit 1
     fi
+    eval "$(micromamba shell hook --shell bash)"
+    micromamba activate refgenie_v0.12.1
+    environment=$(micromamba info | awk '/environment/ && /active/ {print $3}')
+    if [[ $environment == *"refgenie"* ]]; then
+        log_message "$environment environment successfully activated." green
+    else
+        log_message "Refgenie environment is NOT ACTIVE. Exiting..." blk_red
+        exit 1
+    fi
     if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist
         log_message "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.fasta in /data/bi/references/refgenie/alias/${family}/fasta/${ref}."
         digest=$(openssl rand -hex 24)
@@ -255,6 +264,16 @@ check_references() {
     if [ -z "$REF_GFF" ]; then
         log_message "File ${ref}.gff is not yet downloaded."
         if [ ! -v family ]; then obtain_family; if [ -z ${family} ]; then return; fi; fi
+        if [[ $environment != *"refgenie"* ]]; then
+            eval "$(micromamba shell hook --shell bash)"
+            micromamba activate refgenie_v0.12.1
+            environment=$(micromamba info | awk '/environment/ && /active/ {print $3}')
+            if [[ $environment == *"refgenie"* ]]; then
+                log_message "$environment environment successfully activated." green
+            else
+                log_message "Refgenie environment is NOT ACTIVE. Exiting..." blk_red
+            fi
+        fi
         if [ ! -e "/data/bi/references/refgenie/alias/${family}" ]; then # Check if directory doesn't exist
             log_message "Creating new directory: /data/bi/references/refgenie/alias/${family}/ and saving file ${ref}.gff in /data/bi/references/refgenie/alias/${family}/gff/${ref}."
             digest=$(openssl rand -hex 24)
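Context for the micromamba block introduced in PATCH 153: micromamba activate is a shell function that only exists after the shell hook has been evaluated, so a non-interactive script such as this lablog must bootstrap it explicitly. A minimal standalone sketch of the pattern (the environment name is taken from the patch; the rest is illustrative):

#!/usr/bin/env bash
set -e
eval "$(micromamba shell hook --shell bash)"  # defines the activate/deactivate shell functions
micromamba activate refgenie_v0.12.1          # would fail without the hook line above
micromamba info | awk '/environment/ && /active/ {print $3}'  # prints the active environment

The second copy of the block (in the gff branch) checks $environment first, so the hook is only re-evaluated when the earlier activation did not run.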
From 2f6bfdcea3f1b80aa2b270d3567c2dcf0278803 Mon Sep 17 00:00:00 2001
From: "jaime.ozaez"
Date: Fri, 16 Aug 2024 10:56:48 +0200
Subject: [PATCH 154/321] Updated CHANGELOG.md

---
 CHANGELOG.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 35b6a0478..d2dc42510 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -59,6 +59,7 @@ Code contributions to the new version:
 - Fixed IRMA's lablog so that the sequences of the samples are not displayed several times neither in the .txt files of each influenza type nor in all_samples_completo.txt [#305](https://github.com/BU-ISCIII/buisciii-tools/pull/305)
 - Modified bioinfo_doc.py so that new lines in the delivery message are applied in the email [#307](https://github.com/BU-ISCIII/buisciii-tools/pull/307)
 - Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306)
+- Fixed bug when lablog_viralrecon tries to download references that don't belong to any family. [#310](https://github.com/BU-ISCIII/buisciii-tools/pull/310)

 ### Modules

From 936df9a1ace69d9a60d2e1079088501ece2feaf8 Mon Sep 17 00:00:00 2001
From: svarona
Date: Thu, 1 Aug 2024 11:29:43 +0200
Subject: [PATCH 155/321] created python for irma vcf

---
 .../04-irma/create_irma_vcf.py | 712 ++++++++++++++++++
 1 file changed, 712 insertions(+)
 create mode 100644 bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py

diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py
new file mode 100644
index 000000000..bf909cb60
--- /dev/null
+++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py
@@ -0,0 +1,712 @@
+# imports
+from Bio import SeqIO
+import statistics
+import argparse
+import sys
+
+
+def parse_args(args=None):
+    Description = "Convert alignment between IRMA consensus and reference fasta to VCF file using IRMA stats"
+    Epilog = """Example usage: python create_irma_vcf.py -a <alignment> -i <irma_alleles> -o <out_vcf>"""
+
+    parser = argparse.ArgumentParser(description=Description, epilog=Epilog)
+    parser.add_argument(
+        "-a",
+        "--alignment",
+        type=str,
+        required=True,
+        help="Alignment file",
+    )
+    parser.add_argument(
+        "-i",
+        "--irma_alleles",
+        type=str,
+        required=True,
+        help="IRMA allAlleles.txt file",
+    )
+    parser.add_argument(
+        "-o",
+        "--out_vcf",
+        type=str,
+        required=True,
+        help="Output vcf file",
+    )
+    return parser.parse_args(args)
+
+
+def alleles_to_dict(alleles_file):
+    """Convert IRMA's allAlleles file to dictionary.
+
+    Parameters
+    ----------
+    alleles_file : str
+        Path to the alleles file.
+
+    Returns
+    -------
+    alleles_dict
+        Dictionary containing alleles information with positions as keys.
+ E.g: + { + 1: { + 'Reference_Name': 'rsv_a2', + 'Position': '1', + 'Allele': 'A', + 'Count': '2', + 'Total': '2', + 'Frequency': '1', + 'Average_Quality': '29.5', + 'ConfidenceNotMacErr': '0.998877981545698', + 'PairedUB': '1', + 'QualityUB': '1', + 'Allele_Type': 'Consensus' + } + } + """ + + alleles_dict = {} + with open(alleles_file, "r") as file: + header = file.readline().strip().split('\t') + for line in file: + while line.count('\t') < len(header) - 1: + line += file.readline() + line_data = line.strip().split('\t') + position = int(line_data[1]) + allele_type = line_data[10] + if allele_type == "Consensus": + entry_dict = {header[i]: line_data[i] for i in range(len(header))} + alleles_dict[position] = entry_dict + return alleles_dict + + +def align2dict(alignment_file): + """Convert alignment file to dictionary. + + Parameters + ---------- + alignment_file : str + Path to the alignment file in fasta format. + + Returns + ------- + vcf_dict + Dictionary containing alignment information with alignment positions as keys. + E.g.: + { + "10": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 1, + "SAMPLE_POS": [ + 8, + 9 + ], + "REF": "A", + "ALT": "AAA", + "TYPE": "INS" + }, + "19": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10, + "SAMPLE_POS": [ + 19 + ], + "REF": "T", + "ALT": "A", + "TYPE": "SNP" + }, + "7542": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 7531, + "SAMPLE_POS": [ + 7542 + ], + "REF": "T", + "ALT": "TT", + "TYPE": "INS" + }, + "7543": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 7531, + "SAMPLE_POS": [ + 7543 + ], + "REF": "T", + "ALT": "TC", + "TYPE": "INS" + }, + "7544": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 7531, + "SAMPLE_POS": [ + 7544 + ], + "REF": "C", + "ALT": "CA", + "TYPE": "INS" + }, + "10081": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10068, + "SAMPLE_POS": [ + 10079 + ], + "REF": "AA", + "ALT": "A", + "TYPE": "DEL" + }, + "10082": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10069, + "SAMPLE_POS": [ + 10079 + ], + "REF": "-C", + "ALT": "-", + "TYPE": "DEL" + }, + "10083": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10070, + "SAMPLE_POS": [ + 10079 + ], + "REF": "-T", + "ALT": "-", + "TYPE": "DEL" + } + } + """ + sequences_dict = {} + with open(alignment_file, "r") as alignment: + for sequence in SeqIO.parse(alignment, "fasta"): + sequences_dict[sequence.id] = str(sequence.seq) + sample_id, sample_seq = list(sequences_dict.items())[0] + ref_id, ref_seq = list(sequences_dict.items())[1] + sample_position = 0 + ref_position = 0 + vcf_dict = {} + CHROM = ref_id + ALT = "" + SAMPLE_POS = [] + for i, (sample_base, ref_base) in enumerate(zip(sample_seq, ref_seq)): + align_position = i + 1 + if sample_base != "-": + sample_position += 1 + if ref_base != "-": + ref_position += 1 + if ref_base == "-" and sample_base != "N": + if ref_position == 0: + ALT += sample_base + SAMPLE_POS.append(sample_position) + else: + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position, + "SAMPLE_POS": [sample_position], + "REF": sample_seq[i-1], + "ALT": sample_seq[i-1] + sample_base, + "TYPE": "INS" + } + vcf_dict[align_position] = content_dict + elif ref_position == 1 and len(SAMPLE_POS) > 1: + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position, + "SAMPLE_POS": SAMPLE_POS, + "REF": ref_base, + "ALT": ALT + sample_base, + "TYPE": "INS" + } + vcf_dict[align_position] = content_dict + elif sample_base == "-" and ref_base != "N": + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position-1, + "SAMPLE_POS": [sample_position], + "REF": 
sample_seq[i-1] + ref_base, + "ALT": sample_seq[i-1], + "TYPE": "DEL" + } + vcf_dict[align_position] = content_dict + elif ref_base != sample_base and ref_base != "N" and ref_base != "-" and sample_base != "N" and sample_base != "-": + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position, + "SAMPLE_POS": [sample_position], + "REF": ref_base, + "ALT": sample_base, + "TYPE": "SNP" + } + vcf_dict[align_position] = content_dict + return vcf_dict + + +def stats_vcf(vcf_dictionary, alleles_dictionary): + """Add stats to VCF dictionary. + + Parameters + ---------- + vcf_dictionary : dict + Dictionary containing VCF information. + alleles_dictionary : dict + Dictionary containing alleles information. + + Returns + ------- + af_vcf_dict + Updated dictionary with allele frequencies and other metrics. + E.g: + { + "10": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 1, + "SAMPLE_POS": [ + 8, + 9 + ], + "REF": "A", + "ALT": "AAA", + "TYPE": "INS", + "DP": [ + "9" + ], + "AF": [ + "1" + ], + "QUAL": [ + "33.7777777777778" + ] + }, + "19": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10, + "SAMPLE_POS": [ + 19 + ], + "REF": "T", + "ALT": "A", + "TYPE": "SNP", + "DP": [ + "60" + ], + "AF": [ + "0.833333333333333" + ], + "QUAL": [ + "34.0166666666667" + ] + }, + "7542": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 7531, + "SAMPLE_POS": [ + 7542 + ], + "REF": "T", + "ALT": "TT", + "TYPE": "INS", + "DP": [ + "74" + ], + "AF": [ + "0.986666666666667" + ], + "QUAL": [ + "34.8648648648649" + ] + }, + "7543": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 7531, + "SAMPLE_POS": [ + 7543 + ], + "REF": "T", + "ALT": "TC", + "TYPE": "INS", + "DP": [ + "75" + ], + "AF": [ + "1" + ], + "QUAL": [ + "35.04" + ] + }, + "7544": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 7531, + "SAMPLE_POS": [ + 7544 + ], + "REF": "C", + "ALT": "CA", + "TYPE": "INS", + "DP": [ + "75" + ], + "AF": [ + "1" + ], + "QUAL": [ + "33.8533333333333" + ] + }, + "10081": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10068, + "SAMPLE_POS": [ + 10079 + ], + "REF": "AA", + "ALT": "A", + "TYPE": "DEL", + "DP": [ + "10" + ], + "AF": [ + "1" + ], + "QUAL": [ + "34.3" + ] + }, + "10082": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10069, + "SAMPLE_POS": [ + 10079 + ], + "REF": "-C", + "ALT": "-", + "TYPE": "DEL", + "DP": [ + "10" + ], + "AF": [ + "1" + ], + "QUAL": [ + "34.3" + ] + }, + "10083": { + "CHROM": "EPI_ISL_18668201", + "REF_POS": 10070, + "SAMPLE_POS": [ + 10079 + ], + "REF": "-T", + "ALT": "-", + "TYPE": "DEL", + "DP": [ + "10" + ], + "AF": [ + "1" + ], + "QUAL": [ + "34.3" + ] + } + } + """ + af_vcf_dict = {} + for key, value in vcf_dictionary.items(): + DP = [] + AF = [] + QUAL = [] + content_dict = { + "CHROM": value["CHROM"], + "REF_POS": value["REF_POS"], + "SAMPLE_POS": value["SAMPLE_POS"], + "REF": value["REF"], + "ALT": value["ALT"], + "TYPE": value["TYPE"] + } + for position in value["SAMPLE_POS"]: + if position in alleles_dictionary: + alleles_info = alleles_dictionary[position] + if alleles_info["Allele"] == value["ALT"] or value["TYPE"] in ["INS", "DEL"]: + DP.append(alleles_info["Count"]) + AF.append(alleles_info["Frequency"]) + QUAL.append(alleles_info["Average_Quality"]) + break + else: + print("SNP not the same in .fasta file and alleles file") + print(value) + print(alleles_info) + else: + print("Position not detected in allele file!") + print("Position") + print(value["SAMPLE_POS"]) + print(value) + content_dict.update({"DP": DP, "AF": AF, "QUAL": QUAL}) + af_vcf_dict[key] = content_dict + return af_vcf_dict + + 
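# Aside (illustration only, not part of the committed script): combine_indels
# below collapses the single-base insertion records that align2dict emits
# one-by-one into a single left-anchored record. A minimal sketch of that merge,
# reusing sample positions 7542-7544 from the docstring examples:
records = [
    {"REF_POS": 7531, "REF": "T", "ALT": "TT", "TYPE": "INS"},
    {"REF_POS": 7531, "REF": "T", "ALT": "TC", "TYPE": "INS"},
    {"REF_POS": 7531, "REF": "C", "ALT": "CA", "TYPE": "INS"},
]
merged = {}
for rec in records:
    pos = rec["REF_POS"]
    if pos in merged and merged[pos]["TYPE"] == "INS":
        # keep the anchor base already stored, append only the newly inserted base
        merged[pos]["ALT"] += rec["ALT"].replace(rec["REF"], "")
    else:
        merged[pos] = dict(rec)
print(merged[7531]["ALT"])  # -> "TTCA": one INS record instead of three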
+def combine_indels(vcf_dictionary):
+    """Combine insertion and deletion positions in the VCF dictionary.
+
+    Parameters
+    ----------
+    vcf_dictionary : dict
+        Dictionary containing VCF information.
+
+    Returns
+    -------
+    combined_vcf_dict
+        Updated dictionary with combined insertion and deletion variants.
+        {
+            "1": {
+                "CHROM": "EPI_ISL_18668201",
+                "REF_POS": 1,
+                "SAMPLE_POS": [
+                    8,
+                    9
+                ],
+                "REF": "A",
+                "ALT": "AAA",
+                "DP": [
+                    "9"
+                ],
+                "AF": [
+                    "1"
+                ],
+                "QUAL": [
+                    "33.7777777777778"
+                ],
+                "TYPE": "INS"
+            },
+            "10": {
+                "CHROM": "EPI_ISL_18668201",
+                "REF_POS": 10,
+                "SAMPLE_POS": [
+                    19
+                ],
+                "REF": "T",
+                "ALT": "A",
+                "DP": [
+                    "60"
+                ],
+                "AF": [
+                    "0.833333333333333"
+                ],
+                "QUAL": [
+                    "34.0166666666667"
+                ],
+                "TYPE": "SNP"
+            },
+            "7531": {
+                "CHROM": "EPI_ISL_18668201",
+                "REF_POS": 7531,
+                "SAMPLE_POS": [
+                    7542,
+                    7543,
+                    7544
+                ],
+                "REF": "T",
+                "ALT": "TTCA",
+                "DP": [
+                    "74",
+                    "75",
+                    "75"
+                ],
+                "AF": [
+                    "0.986666666666667",
+                    "1",
+                    "1"
+                ],
+                "QUAL": [
+                    "34.8648648648649",
+                    "35.04",
+                    "33.8533333333333"
+                ],
+                "TYPE": "INS"
+            },
+            "10068": {
+                "CHROM": "EPI_ISL_18668201",
+                "REF_POS": 10068,
+                "SAMPLE_POS": [
+                    10079
+                ],
+                "REF": "AACT",
+                "ALT": "A",
+                "DP": [
+                    "10"
+                ],
+                "AF": [
+                    "1"
+                ],
+                "QUAL": [
+                    "34.3"
+                ],
+                "TYPE": "DEL"
+            }
+        }
+
+    """
+    combined_vcf_dict = {}
+    for key, value in vcf_dictionary.items():
+        content_dict = {
+            "CHROM": value["CHROM"],
+            "REF_POS": value["REF_POS"],
+            "SAMPLE_POS": value["SAMPLE_POS"],
+            "REF": value["REF"],
+            "ALT": value["ALT"],
+            "DP": value["DP"],
+            "AF": value["AF"],
+            "QUAL": value["QUAL"],
+            "TYPE": value["TYPE"]
+        }
+        if value["TYPE"] == "INS":
+            if value["REF_POS"] in combined_vcf_dict:
+                if value["TYPE"] == combined_vcf_dict[value["REF_POS"]]["TYPE"]:
+                    NEW_ALT = value["ALT"].replace(value["REF"], "")
+                    combined_vcf_dict[value["REF_POS"]]["ALT"] += NEW_ALT
+                    combined_vcf_dict[value["REF_POS"]]["SAMPLE_POS"].append(value["SAMPLE_POS"][0])
+                    combined_vcf_dict[value["REF_POS"]]["DP"].append(value["DP"][0])
+                    combined_vcf_dict[value["REF_POS"]]["AF"].append(value["AF"][0])
+                    combined_vcf_dict[value["REF_POS"]]["QUAL"].append(value["QUAL"][0])
+                else:
+                    print("Same position annotated with multiple variant types")
+                    print("value")
+                    print(value)
+                    print("combined_vcf_dict")
+                    print(combined_vcf_dict[value["REF_POS"]])
+            else:
+                combined_vcf_dict[value["REF_POS"]] = content_dict
+        elif value["TYPE"] == "DEL":
+            sample_found = False
+            for pos, data in combined_vcf_dict.items():
+                var_type = data["TYPE"]
+                if var_type == "DEL":
+                    if value["SAMPLE_POS"] == data["SAMPLE_POS"]:
+                        if value["TYPE"] == var_type:
+                            sample_found = data["REF_POS"]
+                            break
+                        else:
+                            print("Same position annotated with multiple variant types")
+                            print("value")
+                            print(value)
+                            print("combined_vcf_dict")
+                            print(combined_vcf_dict[value["REF_POS"]])
+            if sample_found:
+                NEW_REF = value["REF"].replace(value["ALT"], "")
+                combined_vcf_dict[sample_found]["REF"] += NEW_REF
+            else:
+                combined_vcf_dict[value["REF_POS"]] = content_dict
+        elif value["TYPE"] == "SNP":
+            if value["REF_POS"] in combined_vcf_dict:
+                if value["TYPE"] == combined_vcf_dict[value["REF_POS"]]["TYPE"]:
+                    print("Repeated SNP!!!")
+                else:
+                    print("Same position annotated with multiple variant types")
+                    print("value")
+                    print(value)
+                    print("combined_vcf_dict")
+                    print(combined_vcf_dict[value["REF_POS"]])
+            else:
+                combined_vcf_dict[value["REF_POS"]] = content_dict
+        else:
+            print("Different annotation type found")
+    return combined_vcf_dict
+
+
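# Aside: in get_vcf_header below, the '##contig=', '##INFO=' and '##FORMAT='
# strings appear with their angle-bracket bodies stripped. For orientation,
# a VCFv4.2 header of the shape the function assembles (IDs inferred from the
# "DP:AF" FORMAT string used in create_vcf; descriptions are assumptions, not
# taken from the patch) would read roughly:
#
#   ##fileformat=VCFv4.2
#   ##source=custom
#   ##contig=<ID=EPI_ISL_18668201>
#   ##INFO=<ID=TYPE,Number=1,Type=String,Description="Variant type: SNP, INS or DEL">
#   ##FORMAT=<ID=DP,Number=1,Type=Integer,Description="Read depth supporting the allele">
#   ##FORMAT=<ID=AF,Number=1,Type=Float,Description="Allele frequency">
#   #CHROM  POS  REF  ALT  QUAL  INFO  FORMAT  <sample_name>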
+def get_vcf_header(chromosome, sample_name):
+    """Create the VCF header for VCFv4.2
+
+    Parameters
+    ----------
+    chromosome : str
+        Chromosome name.
+    sample_name : str
+        Sample name.
+
+    Returns
+    -------
+    header
+        String containing all the VCF header lines separated by newline.
+    """
+    # Define VCF header
+    header_source = ["##fileformat=VCFv4.2", "##source=custom"]
+    header_contig = []
+    if chromosome:
+        header_contig += [
+            "##contig="
+        ]
+    header_source += header_contig
+
+    header_info = [
+        '##INFO=',
+    ]
+    header_format = [
+        '##FORMAT=',
+        '##FORMAT=',
+    ]
+    columns = [
+        '#CHROM\tPOS\tREF\tALT\tQUAL\tINFO\tFORMAT\t' + sample_name
+    ]
+    header = header_source + header_info + header_format + columns
+    return header
+
+
+def create_vcf(variants_dict, out_vcf, alignment):
+    """Create VCF file from variants dictionary.
+
+    Parameters
+    ----------
+    variants_dict : dict
+        Dictionary containing variants information.
+    out_vcf : str
+        Path to the output VCF file.
+    alignment : str
+        Path to the alignment file.
+
+    Returns
+    -------
+    None
+    """
+
+    chrom = next(iter(variants_dict.values()))["CHROM"]
+    sample = alignment.replace(".align.fasta", "")
+    vcf_header = "\n".join(get_vcf_header(chrom, sample))
+    FORMAT = "DP:AF"
+    with open(out_vcf, "w") as file_out:
+        file_out.write(vcf_header + "\n")
+        for key, value in variants_dict.items():
+            CHROM = value["CHROM"]
+            POS = value["REF_POS"]
+            REF = value["REF"]
+            ALT = value["ALT"]
+            QUAL_list = [float(number) for number in value["QUAL"]]
+            QUAL = str(round(statistics.mean(QUAL_list), 2))
+            INFO = "TYPE=" + value["TYPE"]
+            DP_list = [int(number) for number in value["DP"]]
+            AF_list = [float(number) for number in value["AF"]]
+            SAMPLE = str(round(statistics.mean(DP_list))) + ':' + str(round(statistics.mean(AF_list), 4))
+            oline = CHROM + '\t' + str(POS) + '\t' + REF + '\t' + ALT + '\t' + str("".join(QUAL)) + '\t' + INFO + '\t' + FORMAT + '\t' + SAMPLE
+            file_out.write(oline + "\n")
+
+
+def main(args=None):
+    # Process args
+    args = parse_args(args)
+
+    # Initialize vars
+    alignment = args.alignment
+    all_alleles = args.irma_alleles
+    output_vcf = args.out_vcf
+
+    # Start analysis
+    alleles_dict = alleles_to_dict(all_alleles)
+    alignment_dict = align2dict(alignment)
+    af_vcf_dict = stats_vcf(alignment_dict, alleles_dict)
+    combined_vcf_dict = combine_indels(af_vcf_dict)
+    create_vcf(combined_vcf_dict, output_vcf, alignment)
+
+
+if __name__ == "__main__":
+    sys.exit(main())

From 84ab72bba8be324c5913759dda57d24fdecca02a Mon Sep 17 00:00:00 2001
From: svarona
Date: Thu, 1 Aug 2024 11:52:42 +0200
Subject: [PATCH 156/321] @saramonzon changes to add minority variants WIP

---
 .../04-irma/create_irma_vcf.py | 157 +++++++++++-------
 1 file changed, 101 insertions(+), 56 deletions(-)

diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py
index bf909cb60..e9b09e6d3 100644
--- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py
+++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py
@@ -45,23 +45,48 @@ def alleles_to_dict(alleles_file):
     Returns
     -------
     alleles_dict
-        Dictionary containing alleles information with positions as keys.
- E.g: - { - 1: { - 'Reference_Name': 'rsv_a2', - 'Position': '1', - 'Allele': 'A', - 'Count': '2', - 'Total': '2', - 'Frequency': '1', - 'Average_Quality': '29.5', - 'ConfidenceNotMacErr': '0.998877981545698', - 'PairedUB': '1', - 'QualityUB': '1', - 'Allele_Type': 'Consensus' - } - } + Dictionary containing alleles information with chrom+positions+allele as key. e.g. + { + "rsv_a2_1_A": { + "Reference_Name": "rsv_a2", + "Position": "1", + "Allele": "A", + "Count": "2", + "Total": "2", + "Frequency": "1", + "Average_Quality": "29.5", + "ConfidenceNotMacErr": "0.998877981545698", + "PairedUB": "1", + "QualityUB": "1", + "Allele_Type": "Consensus" + }, + "rsv_a2_2204_A": { + "Reference_Name": "rsv_a2", + "Position": "2204", + "Allele": "A", + "Count": "6532", + "Total": "15323", + "Frequency": "0.426287280558637", + "Average_Quality": "34.5708818126148", + "ConfidenceNotMacErr": "0.999181140401206", + "PairedUB": "0.00396999257813604", + "QualityUB": "0.0010642711614851", + "Allele_Type": "Minority" + }, + "rsv_a2_2204_G": { + "Reference_Name": "rsv_a2", + "Position": "2204", + "Allele": "G", + "Count": "8768", + "Total": "15323", + "Frequency": "0.5722117078901", + "Average_Quality": "35.0286268248175", + "ConfidenceNotMacErr": "0.999450989591763", + "PairedUB": "0.00396999257813604", + "QualityUB": "0.00100698799816366", + "Allele_Type": "Consensus" + }, + } """ alleles_dict = {} @@ -72,10 +97,11 @@ def alleles_to_dict(alleles_file): line += file.readline() line_data = line.strip().split('\t') position = int(line_data[1]) - allele_type = line_data[10] - if allele_type == "Consensus": + variant_af = float(line_data[5]) + if variant_af > 0.25: entry_dict = {header[i]: line_data[i] for i in range(len(header))} - alleles_dict[position] = entry_dict + variant = str(line_data[0]) + "_" + str(position) + "_" + str(line_data[2]) + alleles_dict[variant] = entry_dict return alleles_dict @@ -104,15 +130,15 @@ def align2dict(alignment_file): "ALT": "AAA", "TYPE": "INS" }, - "19": { + "11": { "CHROM": "EPI_ISL_18668201", - "REF_POS": 10, + "REF_POS": 2, "SAMPLE_POS": [ - 19 + 11 ], - "REF": "T", + "REF": "A", "ALT": "A", - "TYPE": "SNP" + "TYPE": "REF" }, "7542": { "CHROM": "EPI_ISL_18668201", @@ -238,6 +264,16 @@ def align2dict(alignment_file): "TYPE": "SNP" } vcf_dict[align_position] = content_dict + elif ref_base != "N" and ref_base != "-" and sample_base != "N" and sample_base != "-": + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position, + "SAMPLE_POS": [sample_position], + "REF": ref_base, + "ALT": sample_base, + "TYPE": "REF" + } + vcf_dict[align_position] = content_dict return vcf_dict @@ -257,7 +293,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): Updated dictionary with allele frequencies and other metrics. 
E.g: { - "10": { + "EPI_ISL_18668201_1_AAA": { "CHROM": "EPI_ISL_18668201", "REF_POS": 1, "SAMPLE_POS": [ @@ -268,13 +304,16 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "ALT": "AAA", "TYPE": "INS", "DP": [ - "9" + "9", + "10" ], "AF": [ + "1", "1" ], "QUAL": [ - "33.7777777777778" + "33.7777777777778", + "34" ] }, "19": { @@ -413,37 +452,43 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): } """ af_vcf_dict = {} - for key, value in vcf_dictionary.items(): - DP = [] - AF = [] - QUAL = [] - content_dict = { - "CHROM": value["CHROM"], - "REF_POS": value["REF_POS"], - "SAMPLE_POS": value["SAMPLE_POS"], - "REF": value["REF"], - "ALT": value["ALT"], - "TYPE": value["TYPE"] - } - for position in value["SAMPLE_POS"]: - if position in alleles_dictionary: - alleles_info = alleles_dictionary[position] - if alleles_info["Allele"] == value["ALT"] or value["TYPE"] in ["INS", "DEL"]: - DP.append(alleles_info["Count"]) - AF.append(alleles_info["Frequency"]) - QUAL.append(alleles_info["Average_Quality"]) - break + for _, value in alleles_dictionary.items(): + pos = value["Position"] + for _, subdict in vcf_dictionary.items(): + if value["Allele_Type"] == "Consensus" and subdict["TYPE"] == "REF": + continue + if 'SAMPLE_POS' in subdict and int(pos) in subdict['SAMPLE_POS']: + DP = [] + AF = [] + QUAL = [] + content_dict = { + "CHROM": subdict["CHROM"], + "REF_POS": subdict["REF_POS"], + "SAMPLE_POS": subdict["SAMPLE_POS"], + "REF": subdict["REF"], + "ALT": subdict["ALT"], + "TYPE": subdict["TYPE"] + } + if value["Allele"] == content_dict["ALT"] or value["Allele_Type"] == "Minority" or content_dict["TYPE"] in ["INS", "DEL", "REF"]: + DP.append(value["Count"]) + AF.append(value["Frequency"]) + QUAL.append(value["Average_Quality"]) else: print("SNP not the same in .fasta file and alleles file") print(value) - print(alleles_info) - else: - print("Position not detected in allele file!") - print("Position") - print(value["SAMPLE_POS"]) - print(value) - content_dict.update({"DP": DP, "AF": AF, "QUAL": QUAL}) - af_vcf_dict[key] = content_dict + print(content_dict) + + content_dict.update({"DP": DP, "AF": AF, "QUAL": QUAL}) + variant = content_dict["CHROM"] + "_" + str(content_dict["REF_POS"]) + "_" + content_dict["ALT"] + + if variant in af_vcf_dict: + af_vcf_dict[variant]["DP"] += DP + af_vcf_dict[variant]["AF"] += AF + af_vcf_dict[variant]["QUAL"] += QUAL + else: + af_vcf_dict[variant] = content_dict + break + return af_vcf_dict From fc748cad49394270707da2e4dd379ad09c3672b0 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 11:57:00 +0200 Subject: [PATCH 157/321] Added frequency and depth as parameter filters --- .../04-irma/create_irma_vcf.py | 25 ++++++++++++++++--- 1 file changed, 22 insertions(+), 3 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index e9b09e6d3..03a3f1c7a 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -31,10 +31,26 @@ def parse_args(args=None): required=True, help="Output vcf file", ) + parser.add_argument( + "-f", + "--frequency", + type=float, + default=0.25, + required=True, + help="Minimum Allele Frequency for a variant to be included in the .vcf file. 
Default 0.25.", + ) + parser.add_argument( + "-d", + "--depth", + type=int, + default=10, + required=True, + help="Minimum depth for a variant to be included in the .vcf file. Default 10X.", + ) return parser.parse_args(args) -def alleles_to_dict(alleles_file): +def alleles_to_dict(alleles_file, frequency, depth): """Convert IRMA's allAlleles file to dictionary. Parameters @@ -98,7 +114,8 @@ def alleles_to_dict(alleles_file): line_data = line.strip().split('\t') position = int(line_data[1]) variant_af = float(line_data[5]) - if variant_af > 0.25: + position_dp = float(line_data[4]) + if variant_af >= frequency and position_dp >= depth: entry_dict = {header[i]: line_data[i] for i in range(len(header))} variant = str(line_data[0]) + "_" + str(position) + "_" + str(line_data[2]) alleles_dict[variant] = entry_dict @@ -744,9 +761,11 @@ def main(args=None): alignment = args.alignment all_alleles = args.irma_alleles output_vcf = args.out_vcf + freq = args.frequency + dp = args.depth # Start analysis - alleles_dict = alleles_to_dict(all_alleles) + alleles_dict = alleles_to_dict(all_alleles, freq, dp) alignment_dict = align2dict(alignment) af_vcf_dict = stats_vcf(alignment_dict, alleles_dict) combined_vcf_dict = combine_indels(af_vcf_dict) From ac9dcce7f081fb7e0226992086785b5d72c37017 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:05:23 +0200 Subject: [PATCH 158/321] Added TOTAL_DP to stats --- .../04-irma/create_irma_vcf.py | 16 +++++++++------- 1 file changed, 9 insertions(+), 7 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 03a3f1c7a..e18d25eb3 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -476,6 +476,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): continue if 'SAMPLE_POS' in subdict and int(pos) in subdict['SAMPLE_POS']: DP = [] + TOTAL_DP = [] AF = [] QUAL = [] content_dict = { @@ -494,12 +495,12 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): print("SNP not the same in .fasta file and alleles file") print(value) print(content_dict) - - content_dict.update({"DP": DP, "AF": AF, "QUAL": QUAL}) + content_dict.update({"DP": DP, "TOTAL_DP": TOTAL_DP, "AF": AF, "QUAL": QUAL}) variant = content_dict["CHROM"] + "_" + str(content_dict["REF_POS"]) + "_" + content_dict["ALT"] if variant in af_vcf_dict: af_vcf_dict[variant]["DP"] += DP + af_vcf_dict[variant]["TOTAL_DP"] += TOTAL_DP af_vcf_dict[variant]["AF"] += AF af_vcf_dict[variant]["QUAL"] += QUAL else: @@ -610,6 +611,7 @@ def combine_indels(vcf_dictionary): } """ + combined_vcf_dict = {} for key, value in vcf_dictionary.items(): content_dict = { @@ -619,6 +621,7 @@ def combine_indels(vcf_dictionary): "REF": value["REF"], "ALT": value["ALT"], "DP": value["DP"], + "TOTAL_DP": value["TOTAL_DP"], "AF": value["AF"], "QUAL": value["QUAL"], "TYPE": value["TYPE"] @@ -630,6 +633,7 @@ def combine_indels(vcf_dictionary): combined_vcf_dict[value["REF_POS"]]["ALT"] += NEW_ALT combined_vcf_dict[value["REF_POS"]]["SAMPLE_POS"].append(value["SAMPLE_POS"][0]) combined_vcf_dict[value["REF_POS"]]["DP"].append(value["DP"][0]) + combined_vcf_dict[value["REF_POS"]]["TOTAL_DP"].append(value["TOTAL_DP"][0]) combined_vcf_dict[value["REF_POS"]]["AF"].append(value["AF"][0]) combined_vcf_dict[value["REF_POS"]]["QUAL"].append(value["QUAL"][0]) else: @@ -692,7 +696,7 
@@ def get_vcf_header(chromosome, sample_name): header String containing all the VCF header lines separated by newline. """ - # Define VCF header + header_source = ["##fileformat=VCFv4.2", "##source=custom"] header_contig = [] if chromosome: @@ -743,10 +747,8 @@ def create_vcf(variants_dict, out_vcf, alignment): POS = value["REF_POS"] REF = value["REF"] ALT = value["ALT"] - QUAL_list = [float(number) for number in value["QUAL"]] - QUAL = str(round(statistics.mean(QUAL_list), 2)) - INFO = "TYPE=" + value["TYPE"] - DP_list = [int(number) for number in value["DP"]] + TOTAL_DP_list = [int(number) for number in value["TOTAL_DP"]] + INFO = "TYPE=" + value["TYPE"] + ';' + "DP=" + str(round(statistics.mean(TOTAL_DP_list))) AF_list = [float(number) for number in value["AF"]] SAMPLE = str(round(statistics.mean(DP_list))) + ':' + str(round(statistics.mean(AF_list), 4)) oline = CHROM + '\t' + str(POS) + '\t' + REF + '\t' + ALT + '\t' + str("".join(QUAL)) + '\t' + INFO + '\t' + FORMAT + '\t' + SAMPLE From 0673ef949cca539380a44d8238afc1e7b43c27b7 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:06:23 +0200 Subject: [PATCH 159/321] Updated VCF data to fit in VCFv4.2 format --- .../04-irma/create_irma_vcf.py | 32 +++++++++++++++---- 1 file changed, 25 insertions(+), 7 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index e18d25eb3..44f7b945d 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -707,15 +707,21 @@ def get_vcf_header(chromosome, sample_name): header_info = [ '##INFO=', + '##INFO=' + ] + header_filter = [ + '##FILTER=', ] header_format = [ - '##FORMAT=', - '##FORMAT=', + '##FORMAT=', + '##FORMAT=', + '##FORMAT=', + '##FORMAT=', ] columns = [ - '#CHROM\tPOS\tREF\tALT\tQUAL\tINFO\tFORMAT\t' + sample_name + '#CHROM\tPOS\tID\tREF\tALT\tQUAL\tFILTER\tINFO\tFORMAT\t' + sample_name ] - header = header_source + header_info + header_format + columns + header = header_source + header_info + header_filter + header_format + columns return header @@ -739,7 +745,11 @@ def create_vcf(variants_dict, out_vcf, alignment): chrom = next(iter(variants_dict.values()))["CHROM"] sample = alignment.replace(".align.fasta", "") vcf_header = "\n".join(get_vcf_header(chrom, sample)) - FORMAT = "DP:AF" + FORMAT = "GT:ALT_DP:ALT_QUAL:ALT_FREQ" + ID = "." + QUAL = "." 
+ FILTER = "PASS" + GT = "1" with open(out_vcf, "w") as file_out: file_out.write(vcf_header + "\n") for key, value in variants_dict.items(): @@ -749,9 +759,17 @@ def create_vcf(variants_dict, out_vcf, alignment): ALT = value["ALT"] TOTAL_DP_list = [int(number) for number in value["TOTAL_DP"]] INFO = "TYPE=" + value["TYPE"] + ';' + "DP=" + str(round(statistics.mean(TOTAL_DP_list))) + ALT_QUAL_list = [] + for number in value["QUAL"]: + if number != "NA": + ALT_QUAL_list.append(float(number)) + ALT_QUAL = str(round(statistics.mean(ALT_QUAL_list), 2)) + else: + ALT_QUAL = "NA" + ALT_DP_list = [int(number) for number in value["DP"]] AF_list = [float(number) for number in value["AF"]] - SAMPLE = str(round(statistics.mean(DP_list))) + ':' + str(round(statistics.mean(AF_list), 4)) - oline = CHROM + '\t' + str(POS) + '\t' + REF + '\t' + ALT + '\t' + str("".join(QUAL)) + '\t' + INFO + '\t' + FORMAT + '\t' + SAMPLE + SAMPLE = GT + ':' + str(round(statistics.mean(ALT_DP_list))) + ':' + ALT_QUAL + ':' + str(round(statistics.mean(AF_list), 4)) + oline = CHROM + '\t' + str(POS) + '\t' + ID + '\t' + REF + '\t' + ALT + '\t' + QUAL + '\t' + FILTER + '\t' + INFO + '\t' + FORMAT + '\t' + SAMPLE file_out.write(oline + "\n") From 3254106accc6ad22d8665b50a8207d51876f486f Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:07:34 +0200 Subject: [PATCH 160/321] Exclude reference alles in both alignment and stats files --- .../ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 44f7b945d..218e6b49a 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -468,11 +468,12 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): } } """ + af_vcf_dict = {} for _, value in alleles_dictionary.items(): pos = value["Position"] - for _, subdict in vcf_dictionary.items(): - if value["Allele_Type"] == "Consensus" and subdict["TYPE"] == "REF": + for align_pos, subdict in vcf_dictionary.items(): + if (value["Allele_Type"] == "Consensus" and subdict["TYPE"] == "REF") or (value["Allele"] == subdict['REF'] and subdict['TYPE'] not in ["DEL", "INS"]): continue if 'SAMPLE_POS' in subdict and int(pos) in subdict['SAMPLE_POS']: DP = [] From a036242079d1c79ffbc02647b40a51af9c828af2 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:11:44 +0200 Subject: [PATCH 161/321] Added code to update minority allele --- .../ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 218e6b49a..e76548233 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -489,6 +489,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "TYPE": subdict["TYPE"] } if value["Allele"] == content_dict["ALT"] or value["Allele_Type"] == "Minority" or content_dict["TYPE"] in ["INS", "DEL", "REF"]: + if value["Allele_Type"] == "Minority": + content_dict.update({"ALT": value["Allele"]}) + content_dict.update({"TYPE": "SNP"}) 
DP.append(value["Count"]) AF.append(value["Frequency"]) QUAL.append(value["Average_Quality"]) From 2b80fa500b4b2dcd26bb357d708158f5f8d58487 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:12:51 +0200 Subject: [PATCH 162/321] Added code for minority deletions --- .../ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index e76548233..8d8a0860c 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -492,6 +492,13 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): if value["Allele_Type"] == "Minority": content_dict.update({"ALT": value["Allele"]}) content_dict.update({"TYPE": "SNP"}) + if value["Allele"] == "-" and value["Allele_Type"] == "Minority": + REF = vcf_dictionary[align_pos-1]["REF"]+subdict["REF"] + ALT = vcf_dictionary[align_pos-1]["REF"] + content_dict.update({"REF_POS": vcf_dictionary[align_pos-1]["REF_POS"]}) + content_dict.update({"REF": REF}) + content_dict.update({"ALT": ALT}) + content_dict.update({"TYPE": "DEL"}) DP.append(value["Count"]) AF.append(value["Frequency"]) QUAL.append(value["Average_Quality"]) From 5276af32ffc5f1437f2c95dd0fd6c2b2198dc2de Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:13:36 +0200 Subject: [PATCH 163/321] Fixed line that was excluding deletions --- .../ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 8d8a0860c..9fdbaab73 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -516,7 +516,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): af_vcf_dict[variant]["QUAL"] += QUAL else: af_vcf_dict[variant] = content_dict - break + pass return af_vcf_dict From 321d1e3c0a220e631923c213168cbe2262688632 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:13:49 +0200 Subject: [PATCH 164/321] Added total dp --- .../IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 1 + 1 file changed, 1 insertion(+) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 9fdbaab73..c94585904 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -500,6 +500,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): content_dict.update({"ALT": ALT}) content_dict.update({"TYPE": "DEL"}) DP.append(value["Count"]) + TOTAL_DP.append(value["Total"]) AF.append(value["Frequency"]) QUAL.append(value["Average_Quality"]) else: From 15166b12439f7846022794419ca9d02b67e6799d Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:14:30 +0200 Subject: [PATCH 165/321] refactored a little bit --- .../ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git 
a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index c94585904..5e26c29ab 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -625,7 +625,7 @@ def combine_indels(vcf_dictionary): """ combined_vcf_dict = {} - for key, value in vcf_dictionary.items(): + for _, value in vcf_dictionary.items(): content_dict = { "CHROM": value["CHROM"], "REF_POS": value["REF_POS"], @@ -658,11 +658,10 @@ def combine_indels(vcf_dictionary): combined_vcf_dict[value["REF_POS"]] = content_dict elif value["TYPE"] == "DEL": sample_found = False - for pos, data in combined_vcf_dict.items(): - var_type = data["TYPE"] - if var_type == "DEL": + for _, data in combined_vcf_dict.items(): + if data["TYPE"] == "DEL": if value["SAMPLE_POS"] == data["SAMPLE_POS"]: - if value["TYPE"] == var_type: + if value["TYPE"] == data["TYPE"]: sample_found = data["REF_POS"] break else: From 2eb5e3bd789746eab737dd3f80cc0ae1f7a80a49 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:24:11 +0200 Subject: [PATCH 166/321] Updated docstrings --- .../04-irma/create_irma_vcf.py | 66 +++++++++++++++---- 1 file changed, 53 insertions(+), 13 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 5e26c29ab..e96ea42f8 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -324,6 +324,10 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "9", "10" ], + "TOTAL_DP": [ + "9", + "10" + ], "AF": [ "1", "1" @@ -333,7 +337,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "34" ] }, - "19": { + "EPI_ISL_18668201_10_A": { "CHROM": "EPI_ISL_18668201", "REF_POS": 10, "SAMPLE_POS": [ @@ -345,6 +349,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "60" ], + "TOTAL_DP": [ + "72" + ], "AF": [ "0.833333333333333" ], @@ -352,7 +359,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "34.0166666666667" ] }, - "7542": { + "EPI_ISL_18668201_7531_TT": { "CHROM": "EPI_ISL_18668201", "REF_POS": 7531, "SAMPLE_POS": [ @@ -364,6 +371,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "74" ], + "TOTAL_DP": [ + "75" + ], "AF": [ "0.986666666666667" ], @@ -371,7 +381,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "34.8648648648649" ] }, - "7543": { + "EPI_ISL_18668201_7531_TC": { "CHROM": "EPI_ISL_18668201", "REF_POS": 7531, "SAMPLE_POS": [ @@ -383,6 +393,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "75" ], + "TOTAL_DP": [ + "75" + ], "AF": [ "1" ], @@ -390,7 +403,7 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "35.04" ] }, - "7544": { + "EPI_ISL_18668201_7531_CA": { "CHROM": "EPI_ISL_18668201", "REF_POS": 7531, "SAMPLE_POS": [ @@ -402,6 +415,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "75" ], + "TOTAL_DP": [ + "75" + ], "AF": [ "1" ], @@ -409,9 +425,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "33.8533333333333" ] }, - "10081": { + "EPI_ISL_18668201_10067_A": { "CHROM": "EPI_ISL_18668201", - "REF_POS": 10068, + "REF_POS": 10067, "SAMPLE_POS": [ 10079 ], @@ -421,6 +437,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "10" ], + "TOTAL_DP": 
[ + "10" + ], "AF": [ "1" ], @@ -428,9 +447,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "34.3" ] }, - "10082": { + "EPI_ISL_18668201_10068_-": { "CHROM": "EPI_ISL_18668201", - "REF_POS": 10069, + "REF_POS": 10068, "SAMPLE_POS": [ 10079 ], @@ -440,6 +459,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "10" ], + "TOTAL_DP": [ + "10" + ], "AF": [ "1" ], @@ -447,9 +469,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "34.3" ] }, - "10083": { + "EPI_ISL_18668201_10069_-": { "CHROM": "EPI_ISL_18668201", - "REF_POS": 10070, + "REF_POS": 10069, "SAMPLE_POS": [ 10079 ], @@ -459,6 +481,9 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "DP": [ "10" ], + "TOTAL_DP": [ + "10" + ], "AF": [ "1" ], @@ -547,6 +572,10 @@ def combine_indels(vcf_dictionary): "DP": [ "9" ], + "TOTAL_DP": [ + "9", + "10" + ], "AF": [ "1" ], @@ -564,7 +593,10 @@ def combine_indels(vcf_dictionary): "REF": "T", "ALT": "A", "DP": [ - "60" + "72" + ], + "TOTAL_DP": [ + "10" ], "AF": [ "0.833333333333333" @@ -589,6 +621,11 @@ def combine_indels(vcf_dictionary): "75", "75" ], + "TOTAL_DP": [ + "75", + "75", + "75" + ], "AF": [ "0.986666666666667", "1", @@ -601,9 +638,9 @@ def combine_indels(vcf_dictionary): ], "TYPE": "INS" }, - "10068": { + "10067": { "CHROM": "EPI_ISL_18668201", - "REF_POS": 10068, + "REF_POS": 10067, "SAMPLE_POS": [ 10079 ], @@ -612,6 +649,9 @@ def combine_indels(vcf_dictionary): "DP": [ "10" ], + "TOTAL_DP": [ + "10", + ], "AF": [ "1" ], From 182af9b41ef3a63a18a980d0ae3c0238c91834f6 Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 12:25:17 +0200 Subject: [PATCH 167/321] black --- .../04-irma/create_irma_vcf.py | 140 +++++++++++++----- 1 file changed, 102 insertions(+), 38 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index e96ea42f8..b12d27ec2 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -107,17 +107,19 @@ def alleles_to_dict(alleles_file, frequency, depth): alleles_dict = {} with open(alleles_file, "r") as file: - header = file.readline().strip().split('\t') + header = file.readline().strip().split("\t") for line in file: - while line.count('\t') < len(header) - 1: + while line.count("\t") < len(header) - 1: line += file.readline() - line_data = line.strip().split('\t') + line_data = line.strip().split("\t") position = int(line_data[1]) variant_af = float(line_data[5]) position_dp = float(line_data[4]) if variant_af >= frequency and position_dp >= depth: entry_dict = {header[i]: line_data[i] for i in range(len(header))} - variant = str(line_data[0]) + "_" + str(position) + "_" + str(line_data[2]) + variant = ( + str(line_data[0]) + "_" + str(position) + "_" + str(line_data[2]) + ) alleles_dict[variant] = entry_dict return alleles_dict @@ -246,9 +248,9 @@ def align2dict(alignment_file): "CHROM": CHROM, "REF_POS": ref_position, "SAMPLE_POS": [sample_position], - "REF": sample_seq[i-1], - "ALT": sample_seq[i-1] + sample_base, - "TYPE": "INS" + "REF": sample_seq[i - 1], + "ALT": sample_seq[i - 1] + sample_base, + "TYPE": "INS", } vcf_dict[align_position] = content_dict elif ref_position == 1 and len(SAMPLE_POS) > 1: @@ -258,37 +260,48 @@ def align2dict(alignment_file): "SAMPLE_POS": SAMPLE_POS, "REF": ref_base, "ALT": ALT + sample_base, - "TYPE": "INS" + "TYPE": "INS", } 
vcf_dict[align_position] = content_dict elif sample_base == "-" and ref_base != "N": content_dict = { "CHROM": CHROM, - "REF_POS": ref_position-1, + "REF_POS": ref_position - 1, "SAMPLE_POS": [sample_position], - "REF": sample_seq[i-1] + ref_base, - "ALT": sample_seq[i-1], - "TYPE": "DEL" + "REF": sample_seq[i - 1] + ref_base, + "ALT": sample_seq[i - 1], + "TYPE": "DEL", } vcf_dict[align_position] = content_dict - elif ref_base != sample_base and ref_base != "N" and ref_base != "-" and sample_base != "N" and sample_base != "-": + elif ( + ref_base != sample_base + and ref_base != "N" + and ref_base != "-" + and sample_base != "N" + and sample_base != "-" + ): content_dict = { "CHROM": CHROM, "REF_POS": ref_position, "SAMPLE_POS": [sample_position], "REF": ref_base, "ALT": sample_base, - "TYPE": "SNP" + "TYPE": "SNP", } vcf_dict[align_position] = content_dict - elif ref_base != "N" and ref_base != "-" and sample_base != "N" and sample_base != "-": + elif ( + ref_base != "N" + and ref_base != "-" + and sample_base != "N" + and sample_base != "-" + ): content_dict = { "CHROM": CHROM, "REF_POS": ref_position, "SAMPLE_POS": [sample_position], "REF": ref_base, "ALT": sample_base, - "TYPE": "REF" + "TYPE": "REF", } vcf_dict[align_position] = content_dict return vcf_dict @@ -498,9 +511,12 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): for _, value in alleles_dictionary.items(): pos = value["Position"] for align_pos, subdict in vcf_dictionary.items(): - if (value["Allele_Type"] == "Consensus" and subdict["TYPE"] == "REF") or (value["Allele"] == subdict['REF'] and subdict['TYPE'] not in ["DEL", "INS"]): + if (value["Allele_Type"] == "Consensus" and subdict["TYPE"] == "REF") or ( + value["Allele"] == subdict["REF"] + and subdict["TYPE"] not in ["DEL", "INS"] + ): continue - if 'SAMPLE_POS' in subdict and int(pos) in subdict['SAMPLE_POS']: + if "SAMPLE_POS" in subdict and int(pos) in subdict["SAMPLE_POS"]: DP = [] TOTAL_DP = [] AF = [] @@ -511,16 +527,22 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): "SAMPLE_POS": subdict["SAMPLE_POS"], "REF": subdict["REF"], "ALT": subdict["ALT"], - "TYPE": subdict["TYPE"] + "TYPE": subdict["TYPE"], } - if value["Allele"] == content_dict["ALT"] or value["Allele_Type"] == "Minority" or content_dict["TYPE"] in ["INS", "DEL", "REF"]: + if ( + value["Allele"] == content_dict["ALT"] + or value["Allele_Type"] == "Minority" + or content_dict["TYPE"] in ["INS", "DEL", "REF"] + ): if value["Allele_Type"] == "Minority": content_dict.update({"ALT": value["Allele"]}) content_dict.update({"TYPE": "SNP"}) if value["Allele"] == "-" and value["Allele_Type"] == "Minority": - REF = vcf_dictionary[align_pos-1]["REF"]+subdict["REF"] - ALT = vcf_dictionary[align_pos-1]["REF"] - content_dict.update({"REF_POS": vcf_dictionary[align_pos-1]["REF_POS"]}) + REF = vcf_dictionary[align_pos - 1]["REF"] + subdict["REF"] + ALT = vcf_dictionary[align_pos - 1]["REF"] + content_dict.update( + {"REF_POS": vcf_dictionary[align_pos - 1]["REF_POS"]} + ) content_dict.update({"REF": REF}) content_dict.update({"ALT": ALT}) content_dict.update({"TYPE": "DEL"}) @@ -532,8 +554,16 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): print("SNP not the same in .fasta file and alleles file") print(value) print(content_dict) - content_dict.update({"DP": DP, "TOTAL_DP": TOTAL_DP, "AF": AF, "QUAL": QUAL}) - variant = content_dict["CHROM"] + "_" + str(content_dict["REF_POS"]) + "_" + content_dict["ALT"] + content_dict.update( + {"DP": DP, "TOTAL_DP": TOTAL_DP, "AF": AF, "QUAL": QUAL} + ) + variant = ( + 
content_dict["CHROM"] + + "_" + + str(content_dict["REF_POS"]) + + "_" + + content_dict["ALT"] + ) if variant in af_vcf_dict: af_vcf_dict[variant]["DP"] += DP @@ -676,16 +706,20 @@ def combine_indels(vcf_dictionary): "TOTAL_DP": value["TOTAL_DP"], "AF": value["AF"], "QUAL": value["QUAL"], - "TYPE": value["TYPE"] + "TYPE": value["TYPE"], } if value["TYPE"] == "INS": if value["REF_POS"] in combined_vcf_dict: if value["TYPE"] == combined_vcf_dict[value["REF_POS"]]["TYPE"]: NEW_ALT = value["ALT"].replace(value["REF"], "") combined_vcf_dict[value["REF_POS"]]["ALT"] += NEW_ALT - combined_vcf_dict[value["REF_POS"]]["SAMPLE_POS"].append(value["SAMPLE_POS"][0]) + combined_vcf_dict[value["REF_POS"]]["SAMPLE_POS"].append( + value["SAMPLE_POS"][0] + ) combined_vcf_dict[value["REF_POS"]]["DP"].append(value["DP"][0]) - combined_vcf_dict[value["REF_POS"]]["TOTAL_DP"].append(value["TOTAL_DP"][0]) + combined_vcf_dict[value["REF_POS"]]["TOTAL_DP"].append( + value["TOTAL_DP"][0] + ) combined_vcf_dict[value["REF_POS"]]["AF"].append(value["AF"][0]) combined_vcf_dict[value["REF_POS"]]["QUAL"].append(value["QUAL"][0]) else: @@ -751,14 +785,12 @@ def get_vcf_header(chromosome, sample_name): header_source = ["##fileformat=VCFv4.2", "##source=custom"] header_contig = [] if chromosome: - header_contig += [ - "##contig=" - ] + header_contig += ["##contig="] header_source += header_contig header_info = [ '##INFO=', - '##INFO=' + '##INFO=', ] header_filter = [ '##FILTER=', @@ -769,9 +801,7 @@ def get_vcf_header(chromosome, sample_name): '##FORMAT=', '##FORMAT=', ] - columns = [ - '#CHROM\tPOS\tID\tREF\tALT\tQUAL\tFILTER\tINFO\tFORMAT\t' + sample_name - ] + columns = ["#CHROM\tPOS\tID\tREF\tALT\tQUAL\tFILTER\tINFO\tFORMAT\t" + sample_name] header = header_source + header_info + header_filter + header_format + columns return header @@ -809,7 +839,13 @@ def create_vcf(variants_dict, out_vcf, alignment): REF = value["REF"] ALT = value["ALT"] TOTAL_DP_list = [int(number) for number in value["TOTAL_DP"]] - INFO = "TYPE=" + value["TYPE"] + ';' + "DP=" + str(round(statistics.mean(TOTAL_DP_list))) + INFO = ( + "TYPE=" + + value["TYPE"] + + ";" + + "DP=" + + str(round(statistics.mean(TOTAL_DP_list))) + ) ALT_QUAL_list = [] for number in value["QUAL"]: if number != "NA": @@ -819,8 +855,36 @@ def create_vcf(variants_dict, out_vcf, alignment): ALT_QUAL = "NA" ALT_DP_list = [int(number) for number in value["DP"]] AF_list = [float(number) for number in value["AF"]] - SAMPLE = GT + ':' + str(round(statistics.mean(ALT_DP_list))) + ':' + ALT_QUAL + ':' + str(round(statistics.mean(AF_list), 4)) - oline = CHROM + '\t' + str(POS) + '\t' + ID + '\t' + REF + '\t' + ALT + '\t' + QUAL + '\t' + FILTER + '\t' + INFO + '\t' + FORMAT + '\t' + SAMPLE + SAMPLE = ( + GT + + ":" + + str(round(statistics.mean(ALT_DP_list))) + + ":" + + ALT_QUAL + + ":" + + str(round(statistics.mean(AF_list), 4)) + ) + oline = ( + CHROM + + "\t" + + str(POS) + + "\t" + + ID + + "\t" + + REF + + "\t" + + ALT + + "\t" + + QUAL + + "\t" + + FILTER + + "\t" + + INFO + + "\t" + + FORMAT + + "\t" + + SAMPLE + ) file_out.write(oline + "\n") From a698f50ef8017524e513e76b28859588959fdebc Mon Sep 17 00:00:00 2001 From: svarona Date: Thu, 1 Aug 2024 13:14:25 +0200 Subject: [PATCH 168/321] Updated changelog --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index d2dc42510..8da193baa 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -56,6 +56,7 @@ Code contributions to the new version: - Updated services.json, mtbseq's lablog, viralrecon's 
lablog and assembly's config file [#299](https://github.com/BU-ISCIII/buisciii-tools/pull/299) - Added lablog to automate gene characterization with emmtyper, including unzipping assemblies. [#300](https://github.com/BU-ISCIII/buisciii-tools/pull/300) - Fixed 99-stats (MAG) template. [#301](https://github.com/BU-ISCIII/buisciii-tools/pull/301) +- Created a python script to process IRMA's results and create a standard vcf file against reference. [#304](https://github.com/BU-ISCIII/buisciii-tools/pull/304) - Fixed IRMA's lablog so that the sequences of the samples are not displayed several times neither in the .txt files of each influenza type nor in all_samples_completo.txt [#305](https://github.com/BU-ISCIII/buisciii-tools/pull/305) - Modified bioinfo_doc.py so that new lines in the delivery message are applied in the email [#307](https://github.com/BU-ISCIII/buisciii-tools/pull/307) - Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306) From 432ebd88f7cb9f5bb8008c33f4ea0421930d718e Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 6 Aug 2024 12:58:04 +0200 Subject: [PATCH 169/321] Managed deletions at the begining of alignment --- .../04-irma/create_irma_vcf.py | 61 +++++++++++++++---- 1 file changed, 50 insertions(+), 11 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index b12d27ec2..2d1129446 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -264,15 +264,26 @@ def align2dict(alignment_file): } vcf_dict[align_position] = content_dict elif sample_base == "-" and ref_base != "N": - content_dict = { - "CHROM": CHROM, - "REF_POS": ref_position - 1, - "SAMPLE_POS": [sample_position], - "REF": sample_seq[i - 1] + ref_base, - "ALT": sample_seq[i - 1], - "TYPE": "DEL", - } - vcf_dict[align_position] = content_dict + if sample_position == 0: + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position, + "SAMPLE_POS": [sample_position], + "REF": ref_base + ref_seq[i + 1], + "ALT": ref_seq[i + 1], + "TYPE": "DEL", + } + vcf_dict[align_position] = content_dict + else: + content_dict = { + "CHROM": CHROM, + "REF_POS": ref_position - 1, + "SAMPLE_POS": [sample_position], + "REF": sample_seq[i - 1] + ref_base, + "ALT": sample_seq[i - 1], + "TYPE": "DEL", + } + vcf_dict[align_position] = content_dict elif ( ref_base != sample_base and ref_base != "N" @@ -516,6 +527,29 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): and subdict["TYPE"] not in ["DEL", "INS"] ): continue + if 0 in subdict["SAMPLE_POS"] and len(subdict["SAMPLE_POS"]) == 1: + content_dict = { + "CHROM": subdict["CHROM"], + "REF_POS": subdict["REF_POS"], + "SAMPLE_POS": subdict["SAMPLE_POS"], + "REF": subdict["REF"], + "ALT": subdict["ALT"], + "TYPE": subdict["TYPE"], + "DP": ["NA"], + "TOTAL_DP": ["NA"], + "AF": ["NA"], + "QUAL": ["NA"], + } + variant = ( + content_dict["CHROM"] + + "_" + + str(content_dict["REF_POS"]) + + "_" + + content_dict["ALT"] + ) + af_vcf_dict[variant] = content_dict + pass + if "SAMPLE_POS" in subdict and int(pos) in subdict["SAMPLE_POS"]: DP = [] TOTAL_DP = [] @@ -745,8 +779,12 @@ def combine_indels(vcf_dictionary): print("combined_vcf_dict") 
print(combined_vcf_dict[value["REF_POS"]]) if sample_found: - NEW_REF = value["REF"].replace(value["ALT"], "") - combined_vcf_dict[sample_found]["REF"] += NEW_REF + if 0 in value["SAMPLE_POS"] and len(value["SAMPLE_POS"]) == 1: + combined_vcf_dict[sample_found]["REF"] += value["ALT"] + combined_vcf_dict[sample_found]["ALT"] = value["ALT"] + else: + NEW_REF = value["REF"][len(value["ALT"]):] + combined_vcf_dict[sample_found]["REF"] += NEW_REF else: combined_vcf_dict[value["REF_POS"]] = content_dict elif value["TYPE"] == "SNP": @@ -909,3 +947,4 @@ def main(args=None): if __name__ == "__main__": sys.exit(main()) + From 69f7193421eca9bc6a79a4d39f345ce5f7241c30 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 6 Aug 2024 12:58:44 +0200 Subject: [PATCH 170/321] Managed missing data in stats --- .../04-irma/create_irma_vcf.py | 44 +++++++++++++++---- 1 file changed, 35 insertions(+), 9 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 2d1129446..613d7f909 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -876,31 +876,57 @@ def create_vcf(variants_dict, out_vcf, alignment): POS = value["REF_POS"] REF = value["REF"] ALT = value["ALT"] - TOTAL_DP_list = [int(number) for number in value["TOTAL_DP"]] + TOTAL_DP_list = [] + for number in value["TOTAL_DP"]: + if number != "NA": + TOTAL_DP_list.append(int(number)) + if TOTAL_DP_list: + TOTAL_DP = str(round(statistics.mean(TOTAL_DP_list))) + else: + TOTAL_DP = "NA" + INFO = ( "TYPE=" + value["TYPE"] + ";" + "DP=" - + str(round(statistics.mean(TOTAL_DP_list))) + + TOTAL_DP ) ALT_QUAL_list = [] for number in value["QUAL"]: if number != "NA": ALT_QUAL_list.append(float(number)) - ALT_QUAL = str(round(statistics.mean(ALT_QUAL_list), 2)) - else: - ALT_QUAL = "NA" - ALT_DP_list = [int(number) for number in value["DP"]] - AF_list = [float(number) for number in value["AF"]] + if ALT_QUAL_list: + ALT_QUAL = str(round(statistics.mean(ALT_QUAL_list), 2)) + else: + ALT_QUAL = "NA" + + ALT_DP_list = [] + for number in value["DP"]: + if number != "NA": + ALT_DP_list.append(int(number)) + if ALT_DP_list: + ALT_DP = str(round(statistics.mean(ALT_DP_list), 0)) + else: + ALT_DP = "NA" + + AF_list = [] + for number in value["AF"]: + if number != "NA": + AF_list.append(float(number)) + if AF_list: + AF = str(round(statistics.mean(AF_list), 4)) + else: + AF = "NA" + SAMPLE = ( GT + ":" - + str(round(statistics.mean(ALT_DP_list))) + + ALT_DP + ":" + ALT_QUAL + ":" - + str(round(statistics.mean(AF_list), 4)) + + AF ) oline = ( CHROM From d5c64ba109cfa13ddaebf69c2feb1e52d8787de6 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 6 Aug 2024 12:59:44 +0200 Subject: [PATCH 171/321] Managed minority deletions --- .../ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 613d7f909..9f62e73dc 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -778,6 +778,9 @@ def combine_indels(vcf_dictionary): print(value) print("combined_vcf_dict") 
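                        # annotation (not in the original patch): the new branch added below
                        # also matches a minority (<0.5 AF) deletion whose preceding sample
                        # position falls inside an already-open DEL record, so low-frequency
                        # deletion runs can extend it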
print(combined_vcf_dict[value["REF_POS"]]) + elif minority and prev_sample_pos in data["SAMPLE_POS"]: + sample_found = data["REF_POS"] + break if sample_found: if 0 in value["SAMPLE_POS"] and len(value["SAMPLE_POS"]) == 1: combined_vcf_dict[sample_found]["REF"] += value["ALT"] @@ -785,6 +788,11 @@ def combine_indels(vcf_dictionary): else: NEW_REF = value["REF"][len(value["ALT"]):] combined_vcf_dict[sample_found]["REF"] += NEW_REF + if minority: + combined_vcf_dict[sample_found]["SAMPLE_POS"] += value["SAMPLE_POS"] + combined_vcf_dict[sample_found]["DP"] += value["DP"] + combined_vcf_dict[sample_found]["TOTAL_DP"] += value["TOTAL_DP"] + combined_vcf_dict[sample_found]["AF"] += value["AF"] else: combined_vcf_dict[value["REF_POS"]] = content_dict elif value["TYPE"] == "SNP": From 8ba38eeea871d11b8dbe6aacfb8052855db53bd6 Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 6 Aug 2024 13:03:08 +0200 Subject: [PATCH 172/321] managed minority deletions --- .../ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 9f62e73dc..47f0f7859 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -766,6 +766,14 @@ def combine_indels(vcf_dictionary): combined_vcf_dict[value["REF_POS"]] = content_dict elif value["TYPE"] == "DEL": sample_found = False + minority = False + for af in value["AF"]: + if float(af) < 0.5: + minority = True + prev_sample_pos = "" + if minority and len(value["SAMPLE_POS"]) == 1: + sample_pos = value["SAMPLE_POS"][0] + prev_sample_pos = sample_pos - 1 for _, data in combined_vcf_dict.items(): if data["TYPE"] == "DEL": if value["SAMPLE_POS"] == data["SAMPLE_POS"]: From 878a42b1aed6e2f17ee0bb53c8e14d18b0de4b1e Mon Sep 17 00:00:00 2001 From: svarona Date: Tue, 6 Aug 2024 13:05:47 +0200 Subject: [PATCH 173/321] black --- .../04-irma/create_irma_vcf.py | 25 +++++-------------- 1 file changed, 6 insertions(+), 19 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 47f0f7859..462d19b57 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -794,10 +794,12 @@ def combine_indels(vcf_dictionary): combined_vcf_dict[sample_found]["REF"] += value["ALT"] combined_vcf_dict[sample_found]["ALT"] = value["ALT"] else: - NEW_REF = value["REF"][len(value["ALT"]):] + NEW_REF = value["REF"][len(value["ALT"]) :] combined_vcf_dict[sample_found]["REF"] += NEW_REF if minority: - combined_vcf_dict[sample_found]["SAMPLE_POS"] += value["SAMPLE_POS"] + combined_vcf_dict[sample_found]["SAMPLE_POS"] += value[ + "SAMPLE_POS" + ] combined_vcf_dict[sample_found]["DP"] += value["DP"] combined_vcf_dict[sample_found]["TOTAL_DP"] += value["TOTAL_DP"] combined_vcf_dict[sample_found]["AF"] += value["AF"] @@ -901,13 +903,7 @@ def create_vcf(variants_dict, out_vcf, alignment): else: TOTAL_DP = "NA" - INFO = ( - "TYPE=" - + value["TYPE"] - + ";" - + "DP=" - + TOTAL_DP - ) + INFO = "TYPE=" + value["TYPE"] + ";" + "DP=" + TOTAL_DP ALT_QUAL_list = [] for number in value["QUAL"]: if number != "NA": @@ -935,15 +931,7 @@ def 
create_vcf(variants_dict, out_vcf, alignment): else: AF = "NA" - SAMPLE = ( - GT - + ":" - + ALT_DP - + ":" - + ALT_QUAL - + ":" - + AF - ) + SAMPLE = GT + ":" + ALT_DP + ":" + ALT_QUAL + ":" + AF oline = ( CHROM + "\t" @@ -989,4 +977,3 @@ def main(args=None): if __name__ == "__main__": sys.exit(main()) - From b1f4ba6d7cddebe5ed41f7d0bfbabbe6e4722cb9 Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 7 Aug 2024 09:48:50 +0200 Subject: [PATCH 174/321] Fixed alt_allele in insertions --- .../ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 462d19b57..47c7c2523 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -745,7 +745,7 @@ def combine_indels(vcf_dictionary): if value["TYPE"] == "INS": if value["REF_POS"] in combined_vcf_dict: if value["TYPE"] == combined_vcf_dict[value["REF_POS"]]["TYPE"]: - NEW_ALT = value["ALT"].replace(value["REF"], "") + NEW_ALT = value["ALT"][len(value["REF"]) :] combined_vcf_dict[value["REF_POS"]]["ALT"] += NEW_ALT combined_vcf_dict[value["REF_POS"]]["SAMPLE_POS"].append( value["SAMPLE_POS"][0] From 258c2cbfdfac9b5452b3f8b13a195b3074d063c0 Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 7 Aug 2024 09:49:33 +0200 Subject: [PATCH 175/321] Added management of low af insertions at the end of the sequence --- .../04-irma/create_irma_vcf.py | 45 ++++++++++++++++++- 1 file changed, 43 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py index 47c7c2523..1cd416723 100644 --- a/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py +++ b/bu_isciii/templates/IRMA/ANALYSIS/ANALYSIS01_FLU_IRMA/04-irma/create_irma_vcf.py @@ -318,7 +318,7 @@ def align2dict(alignment_file): return vcf_dict -def stats_vcf(vcf_dictionary, alleles_dictionary): +def stats_vcf(vcf_dictionary, alleles_dictionary, last_pos, last_allele): """Add stats to VCF dictionary. 
Parameters @@ -521,6 +521,41 @@ def stats_vcf(vcf_dictionary, alleles_dictionary): af_vcf_dict = {} for _, value in alleles_dictionary.items(): pos = value["Position"] + chrom = next(iter(vcf_dictionary.values()))["CHROM"] + + if int(pos) > last_pos and value["Allele_Type"] == "Minority": + content_dict = { + "CHROM": chrom, + "REF_POS": last_pos, + "SAMPLE_POS": [pos], + "REF": last_allele, + "ALT": last_allele + value["Allele"], + "TYPE": "INS", + "DP": [value["Count"]], + "TOTAL_DP": [value["Total"]], + "AF": [value["Frequency"]], + "QUAL": [value["Frequency"]], + } + + variant = ( + content_dict["CHROM"] + + "_" + + str(content_dict["REF_POS"]) + + "_" + + "final_ins" + ) + + if variant in af_vcf_dict: + af_vcf_dict[variant]["DP"] += content_dict["DP"] + af_vcf_dict[variant]["TOTAL_DP"] += content_dict["TOTAL_DP"] + af_vcf_dict[variant]["AF"] += content_dict["AF"] + af_vcf_dict[variant]["QUAL"] += content_dict["QUAL"] + af_vcf_dict[variant]["SAMPLE_POS"] += content_dict["SAMPLE_POS"] + af_vcf_dict[variant]["ALT"] += value["Allele"] + else: + af_vcf_dict[variant] = content_dict + pass + for align_pos, subdict in vcf_dictionary.items(): if (value["Allele_Type"] == "Consensus" and subdict["TYPE"] == "REF") or ( value["Allele"] == subdict["REF"] @@ -970,7 +1005,13 @@ def main(args=None): # Start analysis alleles_dict = alleles_to_dict(all_alleles, freq, dp) alignment_dict = align2dict(alignment) - af_vcf_dict = stats_vcf(alignment_dict, alleles_dict) + last_ref_pos = max(position["REF_POS"] for position in alignment_dict.values()) + last_ref_allele = None + for _, value in alignment_dict.items(): + if value["REF_POS"] == last_ref_pos: + last_ref_allele = value["REF"] + break + af_vcf_dict = stats_vcf(alignment_dict, alleles_dict, last_ref_pos, last_ref_allele) combined_vcf_dict = combine_indels(af_vcf_dict) create_vcf(combined_vcf_dict, output_vcf, alignment) From e229ed7d3fcca5ef1abb87fb0adb2733f3a0994c Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 16 Aug 2024 12:47:43 +0200 Subject: [PATCH 176/321] Added mvmoneo to sftp users --- bu_isciii/templates/sftp_user.json | 1 + 1 file changed, 1 insertion(+) diff --git a/bu_isciii/templates/sftp_user.json b/bu_isciii/templates/sftp_user.json index fff8c4a4b..04773c8fb 100755 --- a/bu_isciii/templates/sftp_user.json +++ b/bu_isciii/templates/sftp_user.json @@ -50,5 +50,6 @@ "svazquez": ["Labvirusres"], "ycampos": ["LabUfiecMithocondrial"], "anadonoso": ["Labenterovirus"], + "mvmoneo": ["SpainUDP"], "bioinfoadm": ["test"] } From 6e6e27ef3364b59f1aeb4a4df6a45fa34c3770b0 Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 16 Aug 2024 12:48:56 +0200 Subject: [PATCH 177/321] Updated changelog --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 8da193baa..5b352a739 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -61,6 +61,7 @@ Code contributions to the new version: - Modified bioinfo_doc.py so that new lines in the delivery message are applied in the email [#307](https://github.com/BU-ISCIII/buisciii-tools/pull/307) - Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306) - Fixed bug when lablog_viralrecon tries to download references that don't belong to any family. [#310](https://github.com/BU-ISCIII/buisciii-tools/pull/310) +-Added mvmoneo to SFTP users. 
[#317](https://github.com/BU-ISCIII/buisciii-tools/pull/317)

### Modules

From 5db8f81a3c03c41b3a4daf4ba0644cecd5e2dc14 Mon Sep 17 00:00:00 2001
From: svarona
Date: Fri, 16 Aug 2024 12:50:06 +0200
Subject: [PATCH 178/321] fixed typo

---
 CHANGELOG.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/CHANGELOG.md b/CHANGELOG.md
index 5b352a739..c81d1d99d 100755
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -61,7 +61,7 @@ Code contributions to the new version:
 - Modified bioinfo_doc.py so that new lines in the delivery message are applied in the email [#307](https://github.com/BU-ISCIII/buisciii-tools/pull/307)
 - Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306)
 - Fixed bug when lablog_viralrecon tries to download references that don't belong to any family. [#310](https://github.com/BU-ISCIII/buisciii-tools/pull/310)
--Added mvmoneo to SFTP users. [#317](https://github.com/BU-ISCIII/buisciii-tools/pull/317)
+- Added mvmoneo to SFTP users. [#317](https://github.com/BU-ISCIII/buisciii-tools/pull/317)

 ### Modules

From 051504cbc664cd9a880647a66be7dca0adf26280 Mon Sep 17 00:00:00 2001
From: svarona
Date: Wed, 14 Aug 2024 13:35:34 +0200
Subject: [PATCH 179/321] updated new tx2gene table name in nf-core pipeline

---
 .../02-differential_expression/differential_expression.R | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R
index 160d69dcc..f684a1841 100644
--- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R
+++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R
@@ -550,13 +550,14 @@ cat(blue("########################\nStarting with loading data\n################

 ####LOAD TRANSCRIPT RELATION DATA FILE #########################
 if (opt$differential_expression != "DEM") {
-  tx2gene <- read.table(file.path(opt$rnaseq_dir, "star_salmon", "salmon_tx2gene.tsv"), header = F)
+  tx2gene <- read.table(file.path(opt$rnaseq_dir, "star_salmon", "tx2gene.tsv"), header = F)
   colnames(tx2gene) <- c("TXNAME", "GENEID", "gene_name")
   if ( opt$differential_expression == "DEG") {
     gene_genename <- tx2gene[,c(2:3)]
     gene_genename <- gene_genename %>% distinct()
   }
 }
+
 ####LOAD CLINICAL DATA FILE #########################
 samples_clin_data <- load_sample_data(clinical_data = opt$sample_data, group = opt$group_col)

From 7c82f7ee132b10cfc9464ed28b7c71335c156f66 Mon Sep 17 00:00:00 2001
From: svarona
Date: Wed, 14 Aug 2024 13:35:49 +0200
Subject: [PATCH 180/321] updated plots for DETs

---
 .../differential_expression.R | 27 ++++++++++++++-----
 1 file changed, 21 insertions(+), 6 deletions(-)

diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R
index f684a1841..f1a7f397a 100644
--- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R
+++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/differential_expression.R
@@ -363,9
+363,17 @@ differential_plots <- function(res_de, de_results, ntd_subset, dds_subset){ rownames(df) <- colnames(ntd_subset) to_plot <- assay_ntd[select,] to_plot_geneid <- as.data.frame(rownames(to_plot)) - colnames(to_plot_geneid) <- "GeneID" - to_plot_geneid_merged <- merge(x = to_plot_geneid, y = gene_genename, by.x="GeneID", by.y = "GENEID", all.x = TRUE, all.y = FALSE) - rownames(to_plot) <- to_plot_geneid_merged$gene_name + if ( opt$differential_expression == "DEG") { + colnames(to_plot_geneid) <- "GeneID" + to_plot_geneid_merged <- merge(x = to_plot_geneid, y = gene_genename, by.x="GeneID", by.y = "GENEID", all.x = TRUE, all.y = FALSE) + rownames(to_plot) <- to_plot_geneid_merged$gene_name + } + + if ( opt$differential_expression == "DET") { + colnames(to_plot_geneid) <- "TranscriptID" + rownames(to_plot) <- to_plot_geneid$TranscriptID + } + pdf(file="Differential_expression/DESeq2/heatmapCount_top20_differentially_expressed.pdf") pheatmap(to_plot, cluster_rows=TRUE, show_rownames=TRUE, cluster_cols=TRUE, annotation_col=df, main="Top 20 significant genes") @@ -444,9 +452,16 @@ quality_plots <- function(data_subset){ to_plot <- assay(data_subset$subset_ntd)[select,] to_plot_geneid <- as.data.frame(rownames(to_plot)) - colnames(to_plot_geneid) <- "GeneID" - to_plot_geneid_merged <- merge(x = to_plot_geneid, y = gene_genename, by.x="GeneID", by.y = "GENEID", all.x = TRUE, all.y = FALSE) - rownames(to_plot) <- to_plot_geneid_merged$gene_name + if ( opt$differential_expression == "DEG") { + colnames(to_plot_geneid) <- "GeneID" + to_plot_geneid_merged <- merge(x = to_plot_geneid, y = gene_genename, by.x="GeneID", by.y = "GENEID", all.x = TRUE, all.y = FALSE) + rownames(to_plot) <- to_plot_geneid_merged$gene_name + } + + if ( opt$differential_expression == "DET") { + colnames(to_plot_geneid) <- "TranscriptID" + rownames(to_plot) <- to_plot_geneid$TranscriptID + } pdf(file="Quality_plots/DESeq2/heatmapCount_top20_highest_expression.pdf") pheatmap(to_plot, cluster_rows=FALSE, show_rownames=TRUE, From 1d42ab1a58d73b0c420ee4423823624c051fd258 Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 14 Aug 2024 13:36:12 +0200 Subject: [PATCH 181/321] added original timeseries script --- .../time_series_differential_expression.R | 343 ++++++++++++++++++ 1 file changed, 343 insertions(+) create mode 100644 bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R new file mode 100644 index 000000000..5ad14850b --- /dev/null +++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R @@ -0,0 +1,343 @@ +#!/usr/bin/env Rscript + +################################################ +################################################ +## LOAD LIBRARIES ## +################################################ +################################################ + +####DESeq2 libraries +library(DESeq2) +library(tximport) +library(readr) + +####fishpond libraries +library(fishpond) +library(tximeta) +library(SummarizedExperiment) +####Other libraries +library(optparse) +#library(xlsx) +#options(java.parameters = "-Xmx4G") +library(dplyr) +library(pheatmap) +library(RColorBrewer) +library(ggplot2) +library(vsn) +library(crayon) 
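+# NOTE (annotation, not in the original template): tidytable/data.table below are
+# loaded for fast data-frame wrangling; as with the commented-out xlsx import
+# above, not every package in this header may be strictly required by all paths.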
+library(tidytable)
+library(data.table)
+
+
+################################################
+################################################
+## PARSE COMMAND-LINE PARAMETERS ##
+################################################
+################################################
+cat(cyan$bgRed$bold("########################\nStarting differential expression pipeline\n###############################\n"))
+
+option_list <- list(
+  make_option(c("-r", "--rnaseq_dir" ), type="character" , default='../../01-rnaseq' , metavar="path" , help="Path to rna-seq results" ),
+  make_option(c("-c", "--clinical_data" ), type="character" , default='./clinical_data.txt' , metavar="path" , help="Path to clinical data file" ),
+  make_option(c("-g", "--group_col" ), type="character" , default='Group' , metavar="string" , help="Colname with the sample classes in sample_data of the experiment for the DE." ),
+  make_option(c("-n", "--norm_counts" ), type="logical" , default=FALSE , metavar="boolean", help="Create table with normalized counts" ),
+  make_option(c("-q", "--quality_plots" ), type="logical" , default=TRUE , metavar="boolean", help="Create quality plots or not." )
+)
+
+opt_parser <- OptionParser(option_list=option_list)
+opt <- parse_args(opt_parser)
+
+cat(blue$bold("########################\nRunning analysis with the following params:\n###############################\n"))
+cat(blue("-Path to RNAseq input folder: ")) + cat(blue(opt$rnaseq_dir))+cat(blue("\n"))
+cat(blue("-Path to samples clinical data: ")) + cat(blue(opt$clinical_data))+cat(blue("\n"))
+cat(blue("-Column with the group info: ")) + cat(blue(opt$group_col))+cat(blue("\n"))
+if (opt$norm_counts) {
+  cat(blue("-Saving normalized counts to file\n"))
+} else{
+  cat(blue("-Not saving normalized counts to file\n"))
+}
+if (opt$quality_plots) {
+  cat(blue("-Creating quality plots\n"))
+} else{
+  cat(blue("-Skipping quality plots\n"))
+}
+
+
+################################################
+################################################
+## FUNCTIONS ##
+################################################
+################################################
+
+################################################
+## LOAD DATA ##
+################################################
+
+####LOAD CLINICAL DATA FILE#########################
+load_sample_data <- function(clinical_data, group) {
+  samples <- read.table(clinical_data, header = T)
+  compare_col <- which(colnames(samples) %in% group)
+  time_col <- which(colnames(samples) %in% c("time"))
+  samples <- samples[,c(1,compare_col, time_col)]
+  colnames(samples) <- c("names","condition", "time")
+  rownames(samples) <- samples$names
+  return(samples)
+}
+
+################################################
+## DESEQ2 ##
+################################################
+
+####DIFFERENTIAL EXPRESSION#########################
+
+deseq2_analysis <- function(txi_data, samples, compare_char1, compare_char2){
+  ddsTxi <- DESeqDataSetFromTximport(txi_data,
+                                     colData = samples,
+                                     design = ~ condition + time + condition:time)
+  dds <- ddsTxi[ rowSums(counts(ddsTxi)) >= 1, ]
+  dds <- DESeq(dds, test = "LRT", reduced = ~ condition + time)
+  res <- results(dds)
+  return(list(dds_matrix = dds, results =res))
+}
+
+####NORMALIZATION#########################
+
+normalized_counts <- function(dds_table){
+  ntd <- normTransform(dds_table)
+  rld <- rlog(dds_table, blind=FALSE)
+  vsd <- varianceStabilizingTransformation(dds_table, blind=FALSE)
+  return(list(dds_norm=dds_table, norm = ntd, rlogtrans =rld, varstab=vsd))
+}
+
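+# For orientation: the LRT above compares the full model (with condition:time)
+# against the reduced one without it, so significant genes are those whose
+# expression trajectory over time differs between conditions. A minimal
+# standalone sketch (object names illustrative, not from this template):
+#   dds <- DESeqDataSetFromTximport(txi, colData = samples,
+#                                   design = ~ condition + time + condition:time)
+#   dds <- DESeq(dds, test = "LRT", reduced = ~ condition + time)
+#   res <- results(dds)  # p-values test the condition:time interaction term
+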
+####DE PLOTS######################### + +differential_plots <- function(res_de, de_results, ntd_subset, dds_subset){ + #MA-plotThe MA-plot shows the log2 fold changes from the treatment over the meanof normalized counts. + #The average of counts normalized by size factor. + pdf(file="Differential_expression/DESeq2/maPlot_all.pdf") + plotMA( res_de, ylim = c(-1, 1) ) + dev.off() + + #############DISPERSION PLOTS################ + pdf(file="Differential_expression/DESeq2/pvalues.pdf") + hist( res_de$pvalue, breaks=20, col="grey", main = "pvalues test for differential expression") + dev.off() + + ##############PHEATMAP############## + assay_ntd <- assay(ntd_subset) + ordered_table <- de_results[order(de_results$pvalue, -abs(de_results$log2FoldChange)),] + ordered_table$identifier <- rownames(ordered_table) + col_num <- which(colnames(ordered_table) == "identifier") + top_sig_genes <- ordered_table[1:20,col_num] + select <- which(rownames(assay_ntd) %in% top_sig_genes) + df <- as.data.frame(colData(dds_subset)[,c("condition")]) + colnames(df) <- c("condition") + rownames(df) <- colnames(ntd_subset) + to_plot <- assay_ntd[select,] + to_plot_geneid <- as.data.frame(rownames(to_plot)) + colnames(to_plot_geneid) <- "GeneID" + to_plot_geneid_merged <- merge(x = to_plot_geneid, y = gene_genename, by.x="GeneID", by.y = "GENEID", all.x = TRUE, all.y = FALSE) + rownames(to_plot) <- to_plot_geneid_merged$gene_name + pdf(file="Differential_expression/DESeq2/heatmapCount_top20_differentially_expressed.pdf") + pheatmap(to_plot, cluster_rows=TRUE, show_rownames=TRUE, + cluster_cols=TRUE, annotation_col=df, main="Top 20 significant genes") + dev.off() +} + + +####QUALITY PLOTS######################### + +quality_plots <- function(norm_data){ + ###########SAMPLE DISTANCE############## + sampleDists <- dist( t( assay(norm_data$rlogtrans) ) ) + + sampleDistMatrix <- as.matrix( sampleDists ) + colours = colorRampPalette(rev(brewer.pal(9, "Blues"))) (255) + pdf(file="Quality_plots/DESeq2/heatmap_sample_to_sample.pdf") + pheatmap(sampleDistMatrix, + clustering_distance_rows=sampleDists, + clustering_distance_cols=sampleDists, + col=colours) + dev.off() + + #############PCA PLOTS################ + pcaData <- plotPCA(norm_data$rlogtrans, intgroup=c("condition"), returnData=TRUE) + pcaData_2 <- plotPCA(norm_data$varstab, intgroup=c("condition"), returnData=TRUE) + percentVar <- round(100 * attr(pcaData, "percentVar")) + pdf(file="Quality_plots/DESeq2/plotPCA.pdf") + pca_plot_rld <- ggplot(pcaData, aes(PC1, PC2, color=condition)) + + geom_point(size=3) + + xlab(paste0("PC1: ",percentVar[1],"% variance")) + + ylab(paste0("PC2: ",percentVar[2],"% variance")) + + geom_text(aes(label = name), color = "black", size=2, position = position_nudge(y = 0.8)) + + labs(title="PCA: rlog") + + coord_fixed() + pca_plot_vsd <- ggplot(pcaData_2, aes(PC1, PC2, color=condition)) + + geom_point(size=3) + + xlab(paste0("PC1: ",percentVar[1],"% variance")) + + ylab(paste0("PC2: ",percentVar[2],"% variance")) + + geom_text(aes(label = name), color = "black", size=2, position = position_nudge(y = 0.8)) + + labs(title="PCA: vsd") + + coord_fixed() + print(pca_plot_rld) + print(pca_plot_vsd) + dev.off() + + #############BOX PLOTS################ + pdf(file="Quality_plots/DESeq2/boxplot.pdf") + boxplot(assay(norm_data$norm), col="blue", las =2) + title(main="Boxplot: normalized counts") + boxplot(log10(assays(norm_data$dds_norm)[["cooks"]]), range=0, las=2) + title(main="Boxplot see outliers: cooks distance") + dev.off() + + 
#############DISPERSION PLOTS################
+  pdf(file="Quality_plots/DESeq2/plotDispersions.pdf")
+  plotDispEsts(norm_data$dds_norm)
+  dev.off()
+
+  #############DEVIATION PLOT################
+  pdf(file="Quality_plots/DESeq2/plotSD.pdf")
+  meanSdPlot(assay(norm_data$norm))
+  dev.off()
+
+  ##############HCLUST###################
+  assay_ntd <- assay(norm_data$norm)
+  pdf(file="Quality_plots/DESeq2/cluster_dendrogram.pdf")
+  plot(hclust(dist(t(assay_ntd)),method="average"))
+  dev.off()
+
+  ##############PHEATMAP##############
+  select <- order(rowMeans(counts(norm_data$dds_norm,normalized=TRUE)),
+                  decreasing=TRUE)[1:20]
+  df <- as.data.frame(colData(norm_data$dds_norm)[,c("condition")])
+  colnames(df) <- c("Condition")
+  rownames(df) <- colnames(norm_data$norm)
+
+  to_plot <- assay(norm_data$norm)[select,]
+  to_plot_geneid <- as.data.frame(rownames(to_plot))
+  colnames(to_plot_geneid) <- "GeneID"
+  to_plot_geneid_merged <- merge(x = to_plot_geneid, y = gene_genename, by.x="GeneID", by.y = "GENEID", all.x = TRUE, all.y = FALSE)
+  rownames(to_plot) <- to_plot_geneid_merged$gene_name
+
+  pdf(file="Quality_plots/DESeq2/heatmapCount_top20_highest_expression.pdf")
+  pheatmap(to_plot, cluster_rows=FALSE, show_rownames=TRUE,
+           cluster_cols=TRUE, annotation_col=df, main="Normalized counts top 20 more expressed genes")
+  dev.off()
+
+  ######FULL PHEATMAP#################
+  pdf(file="Quality_plots/DESeq2/heatmapCount_all_genes.pdf")
+  pheatmap(assay(norm_data$norm), cluster_rows=FALSE, show_rownames=FALSE,
+           cluster_cols=TRUE,main="Normalized counts", annotation_col=df)
+  dev.off()
+}
+
+################################################
+## WARNINGS ##
+################################################
+
+test_data <- function(samples_data, txi_data){
+  if (all(rownames(samples_data) %in% colnames(txi_data$counts)) == FALSE) {
+    print("Warning: Check sample names")
+  }
+  if (all(rownames(samples_data) == colnames(txi_data$counts)) == FALSE) {
+    print("Warning: Check sample names")
+  }
+}
+
+
+##############################################################################################################################################
+##############################################################################################################################################
+##################################################### MAIN ##################################################
+##############################################################################################################################################
+##############################################################################################################################################
+
+
+################################################
+################################################
+## LOAD DATA ##
+################################################
+################################################
+
+cat(blue("########################\nStarting with loading data\n###############################\n"))
+
+####LOAD TRANSCRIPT RELATION DATA FILE #########################
+
+tx2gene <- read.table(file.path(opt$rnaseq_dir, "star_salmon", "salmon_tx2gene.tsv"), header = F)
+colnames(tx2gene) <- c("TXNAME", "GENEID", "gene_name")
+gene_genename <- tx2gene[,c(2:3)]
+gene_genename <- gene_genename %>% distinct()
+
+####LOAD CLINICAL DATA FILE #########################
+samples_clin_data <- load_sample_data(clinical_data = opt$clinical_data, group = opt$group_col)
+
+####LOAD EXPRESSION DATA #########################
+files 
<- file.path(opt$rnaseq_dir,"star_salmon", samples_clin_data$names, "quant.sf")
+names(files) <- samples_clin_data$names
+coldata <- data.frame(files, samples_clin_data, stringsAsFactors=FALSE)
+if (!all(file.exists(coldata$files))) {
+  cat(red("############WARNING############\nNot all files exist\n###############################\n"))
+}
+
+
+################################################
+################################################
+## DIFFERENTIAL EXPRESSION ##
+################################################
+################################################
+
+
+################################################
+################################################
+## DIFFERENTIAL EXPRESSION DESEQ2 ##
+################################################
+################################################
+
+cat(blue("########################\nStarting with DESeq2\n###############################\n"))
+txi <- tximport(files, type="salmon", tx2gene=tx2gene)
+test_data(samples_data = samples_clin_data, txi_data = txi)
+
+cat(blue("########################\nStarting with differential expression\n###############################\n"))
+deseq2_results <- deseq2_analysis(txi_data = txi, samples = samples_clin_data, compare_char1 = opt$treatment, opt$control)
+mcols(deseq2_results$results, use.names = T)
+DE_results <- as.data.frame(deseq2_results$results)
+
+DE_results$GeneID <- row.names(DE_results)
+DE_results_merged <- merge(x = gene_genename, y = DE_results, by.x = "GENEID", by.y= "GeneID", all.y = T, all.x=F)
+
+DE_results_merged_sig <- subset(x = DE_results_merged, padj <= 0.05 & (log2FoldChange <= -2 | log2FoldChange >= 2))
+
+dir.create("Differential_expression",showWarnings = FALSE)
+dir.create("Differential_expression/DESeq2",showWarnings = FALSE)
+write.table(x = DE_results_merged, file = "Differential_expression/DESeq2/Differential_expression.csv", sep = ",", quote = F, col.names = T, row.names = F)
+#write.xlsx(x = DE_results_merged, file = "Differential_expression/DESeq2/Differential_expression.xlsx", sheetName = "Diff_exp", col.names = TRUE, row.names = FALSE, append = FALSE, showNA = TRUE, password = NULL)
+
+
+cat(blue("########################\nStarting with normalization\n###############################\n"))
+norm_count <- normalized_counts(dds_table = deseq2_results$dds_matrix)
+
+if (opt$norm_counts) {
+  ntd_gene <- as.data.frame(assay(norm_count$norm))
+  ntd_gene$GeneID <- rownames(ntd_gene)
+  norm_name_table <- merge(x = gene_genename, y = ntd_gene, by.x = "GENEID", by.y= "GeneID", all.y = T, all.x=F)
+  write.table(x = norm_name_table, file = "normalized_expression.csv", quote = F, sep = ",", row.names = F, col.names = T)
+  #write.xlsx(x = norm_name_table, file = "normalized_expression.xlsx", sheetName = "Norm_exp", col.names = TRUE, row.names = FALSE, append = FALSE, showNA = TRUE, password = NULL)
+}
+
+cat(blue("########################\nStarting with data subsetting\n###############################\n"))
+
+differential_plots(res_de = deseq2_results$results, de_results = DE_results, ntd_subset = norm_count$norm, dds_subset = norm_count$dds_norm)
+
+if (opt$quality_plots) {
+  cat(blue("########################\nStarting with Quality plots\n###############################\n"))
+  dir.create("Quality_plots",showWarnings = FALSE)
+  dir.create("Quality_plots/DESeq2",showWarnings = FALSE)
+  quality_plots(norm_data = norm_count)
+}
+
+save.image()
+cat(blue("########################\nNumber of genes with padj < 0.05 and log2FC >= |2|:\n"))
+cat(blue(nrow(DE_results_merged_sig)))
+cat(blue("\n###############################\n"))
+
+cat(green("########################\nPipeline completed successfully\n###############################\n"))

From 577d0b55a7fdf2f559510ca2ec30ba001a81486d Mon Sep 17 00:00:00 2001
From: svarona
Date: Wed, 14 Aug 2024 14:06:42 +0200
Subject: [PATCH 182/321] prettier

---
 .../time_series_differential_expression.R | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R
index 5ad14850b..de296357f 100644
--- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R
+++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R
@@ -37,11 +37,11 @@ library(data.table)
 cat(cyan$bgRed$bold("########################\nStarting differential expression pipeline\n###############################\n"))

 option_list <- list(
-  make_option(c("-r", "--rnaseq_dir" ), type="character" , default='../../01-rnaseq' , metavar="path" , help="Path to rna-seq results" ),
-  make_option(c("-c", "--clinical_data" ), type="character" , default='./clinical_data.txt' , metavar="path" , help="Path to clinical data file" ),
-  make_option(c("-g", "--group_col" ), type="character" , default='Group' , metavar="string" , help="Colname with the sample classes in sample_data of the experiment for the DE." ),
-  make_option(c("-n", "--norm_counts" ), type="logical" , default=FALSE , metavar="boolean", help="Create table with normalized counts" ),
-  make_option(c("-q", "--quality_plots" ), type="logical" , default=TRUE , metavar="boolean", help="Create quality plots or not." )
+  make_option(c("-r", "--rnaseq_dir" ), type="character" , default='../../01-rnaseq' , metavar="path" , help="Path to rna-seq results" ),
+  make_option(c("-c", "--clinical_data" ), type="character" , default='../clinical_data.txt' , metavar="path" , help="Path to clinical data file" ),
+  make_option(c("-g", "--group_col" ), type="character" , default='Group' , metavar="string" , help="Colname with the sample classes in sample_data of the experiment for the DE." ),
+  make_option(c("-n", "--norm_counts" ), type="logical" , default=FALSE , metavar="boolean", help="Create table with normalized counts" ),
+  make_option(c("-q", "--quality_plots" ), type="logical" , default=TRUE , metavar="boolean", help="Create quality plots or not."
) ) opt_parser <- OptionParser(option_list=option_list) From dbf382d352ecb627be7edc755b496400198a2033 Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 14 Aug 2024 14:08:15 +0200 Subject: [PATCH 183/321] Fixed new nf-core pipeline file name --- .../time_series_differential_expression.R | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R index de296357f..b7b407e3b 100644 --- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R +++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R @@ -263,7 +263,7 @@ cat(blue("########################\nStarting with loading data\n################ ####LOAD TRANSCRIPT RELATION DATA FILE ######################### -tx2gene <- read.table(file.path(opt$rnaseq_dir, "star_salmon", "salmon_tx2gene.tsv"), header = F) +tx2gene <- read.table(file.path(opt$rnaseq_dir, "star_salmon", "tx2gene.tsv"), header = F) colnames(tx2gene) <- c("TXNAME", "GENEID", "gene_name") gene_genename <- tx2gene[,c(2:3)] gene_genename <- gene_genename %>% distinct() From 4c9155b179ee348ed14dbea30c272cac9df73bcd Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 14 Aug 2024 16:38:10 +0200 Subject: [PATCH 184/321] removed unnecessary variables --- .../time_series_differential_expression.R | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R index b7b407e3b..d3358cd2c 100644 --- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R +++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R @@ -90,7 +90,7 @@ load_sample_data <- function(clinical_data, group) { ####DIFFERENTIAL EXPRESSION######################### -deseq2_analysis <- function(txi_data, samples, compare_char1, compare_char2){ +deseq2_analysis <- function(txi_data, samples){ ddsTxi <- DESeqDataSetFromTximport(txi_data, colData = samples, design = ~ condition + time + condition:time) @@ -298,7 +298,7 @@ txi <- tximport(files, type="salmon", tx2gene=tx2gene) test_data(samples_data = samples_clin_data, txi_data = txi) cat(blue("########################\nStarting with differential expression\n###############################\n")) -deseq2_results <- deseq2_analysis(txi_data = txi, samples = samples_clin_data, compare_char1 = opt$treatment, opt$control) +deseq2_results <- deseq2_analysis(txi_data = txi, samples = samples_clin_data) mcols(deseq2_results$results, use.names = T) DE_results <- as.data.frame(deseq2_results$results) From f0289652edeb9de25364f8e41164ca0603c6669a Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 14 Aug 2024 16:39:00 +0200 Subject: [PATCH 185/321] Added time series plots --- .../time_series_differential_expression.R | 60 +++++++++++++++++++ 1 file changed, 60 insertions(+) diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R 
b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R index d3358cd2c..57d1725f4 100644 --- a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R +++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R @@ -232,6 +232,49 @@ quality_plots <- function(norm_data){ dev.off() } +####TIME SERIES PLOTS######################### +time_series_plots <- function(gene, res, dds) { + plot_name <- paste(gene, "expression.pdf", sep = "_") + file_path <- paste("Time_series_plots", plot_name, sep = "/") + index = which(rownames(res) == gene, arr.ind = TRUE) + gene_name <- DE_results_merged[index,2] + fiss <- plotCounts(dds, index, + intgroup = c("time","condition"), returnData = TRUE) + fiss$time <- factor(fiss$time, levels = time_order) + p <- ggplot(fiss, aes(x = time, y = count, color = condition, group = condition)) + + geom_point() + + stat_summary(fun = mean, geom = "line") + + scale_y_log10() + + labs(title = paste("Expression evolution of gene: ", gene_name, sep = "")) + pdf(file=file_path) + print(p) + dev.off() +} + +####WALD TEST FOR TIME SERIES######################### + +wald_test <- function(dds, condition){ + condition_test <- results(dds, name=condition, test="Wald") + print(condition_test[which.min(condition_test$padj),]) +} + +####BETAS PLOT FOR TIME SERIES######################### + +betas_plot <- function(res, dds) { + betas <- coef(dds) + colnames(betas) + + topGenes <- head(order(res$padj),20) + mat <- betas[topGenes, -c(1,2)] + thr <- 3 + mat[mat < -thr] <- -thr + mat[mat > thr] <- thr + pdf(file="Time_series_plots/betas_pheatmap.pdf") + pheatmap(mat, breaks=seq(from=-thr, to=thr, length=101), + cluster_col=TRUE, main = "log2FC of top20 significant genes") + dev.off() +} + ################################################ ## WARNINGS ## ################################################ @@ -335,6 +378,23 @@ if (opt$quality_plots) { quality_plots(norm_data = norm_count) } +cat(blue("########################\nStarting with time series plots\n###############################\n")) + +top4 <- rownames(head(deseq2_results$dds_matrix[order(deseq2_results$results$padj),], 4)) + +dir.create("Time_series_plots",showWarnings = FALSE) + +for (gene in top4) { + time_series_plots(gene, res = deseq2_results$results, dds = deseq2_results$dds_matrix) +} + +all_conditions <- resultsNames(deseq2_results$dds_matrix) +for (condition in all_conditions) { + wald_test(dds = deseq2_results$dds_matrix, condition) +} + +betas_plot(res = deseq2_results$results, dds = deseq2_results$dds_matrix) + save.image() cat(blue("########################\nNumber of genes with padj < 0.05 and log2FC >= |2|:\n")) cat(blue(nrow(DE_results_merged_sig))) From dd749833271dfe32d649613b07a19932e3e88ae2 Mon Sep 17 00:00:00 2001 From: svarona Date: Wed, 14 Aug 2024 16:39:25 +0200 Subject: [PATCH 186/321] Created option to pass date specific order --- .../time_series_differential_expression.R | 12 +++++++++++- 1 file changed, 11 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R index 57d1725f4..ce5b964e9 100644 --- 
a/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R +++ b/bu_isciii/templates/rnaseq/ANALYSIS/DATE_ANALYSIS01_RNASEQ/02-differential_expression/time_series_differential_expression.R @@ -41,7 +41,8 @@ option_list <- list( make_option(c("-c", "--clinical_data" ), type="character" , default='../clinical_data.txt' , metavar="path" , help="Path to clinical data file" ), make_option(c("-g", "--group_col" ), type="character" , default='Group' , metavar="string" , help="Colname with the sample classes in sample_data of the experiment for the DE." ), make_option(c("-n", "--norm_counts" ), type="logical" , default=FALSE , metavar="boolean", help="Create table with normalized counts" ), - make_option(c("-q", "--quality_plots" ), type="logical" , default=TRUE , metavar="boolean", help="Create quality plots or not." ) + make_option(c("-q", "--quality_plots" ), type="logical" , default=TRUE , metavar="boolean", help="Create quality plots or not." ), + make_option(c("-t", "--time_order" ), type="character" , default=NULL , metavar="string" , help="Order to plot the dates as list, eg: 15D,45D,3M." ) ) opt_parser <- OptionParser(option_list=option_list) @@ -51,6 +52,14 @@ cat(blue$bold("########################\nRunning analysis with the following par cat(blue("-Path to RNAseq input folder: ")) + cat(blue(opt$rnaseq_dir))+cat(blue("\n")) cat(blue("-Path to samples clinical data: ")) + cat(blue(opt$clinical_data))+cat(blue("\n")) cat(blue("-Column with the group info: ")) + cat(blue(opt$group_col))+cat(blue("\n")) + +if (is.null(opt$time_order)) { + print_help(opt_parser) + stop("You need to specify the order for the dates.", call.=FALSE) +} else { + time_order <- unlist(strsplit(opt$time_order, ",")) +} + if (opt$norm_counts) { cat(blue("-Saving normalized counts to file\n")) } else{ @@ -62,6 +71,7 @@ if (opt$quality_plots) { cat(blue("-Skipping quality plots\n")) } +cat(blue("Time order: ")) + cat(blue(time_order)) +cat(blue("\n")) ################################################ ################################################ From 2bc885194208f0409a728b71cc79e05f4f8a0999 Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 16 Aug 2024 12:46:24 +0200 Subject: [PATCH 187/321] Updated changelog --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index c81d1d99d..5cf42bc41 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -62,6 +62,7 @@ Code contributions to the new version: - Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306) - Fixed bug when lablog_viralrecon tries to download references that don't belong to any family. [#310](https://github.com/BU-ISCIII/buisciii-tools/pull/310) - Added mvmoneo to SFTP users. 
[#317](https://github.com/BU-ISCIII/buisciii-tools/pull/317) +- Added scripts for time series RNAseq and updated differential expression code for differentially expressed transcripts [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316) ### Modules From 424a4adb70cc29be837aa824f2a91f7d9aaaf8b6 Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 16 Aug 2024 13:12:14 +0200 Subject: [PATCH 188/321] Added bbaladron to SFTP users --- bu_isciii/templates/sftp_user.json | 1 + 1 file changed, 1 insertion(+) diff --git a/bu_isciii/templates/sftp_user.json b/bu_isciii/templates/sftp_user.json index 04773c8fb..f8ee42f60 100755 --- a/bu_isciii/templates/sftp_user.json +++ b/bu_isciii/templates/sftp_user.json @@ -51,5 +51,6 @@ "ycampos": ["LabUfiecMithocondrial"], "anadonoso": ["Labenterovirus"], "mvmoneo": ["SpainUDP"], + "bbaladron": ["SpainUDP"], "bioinfoadm": ["test"] } From 834c08836e7ecb0024fa424598eb5d4cbd833af7 Mon Sep 17 00:00:00 2001 From: svarona Date: Fri, 16 Aug 2024 13:12:48 +0200 Subject: [PATCH 189/321] Updated changelog --- CHANGELOG.md | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 5cf42bc41..cc58e59f7 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -62,7 +62,8 @@ Code contributions to the new version: - Added several improvements in lablog_viralrecon (created log files, modified check_references function behaviour, enabled config files regeneration) [#306](https://github.com/BU-ISCIII/buisciii-tools/pull/306) - Fixed bug when lablog_viralrecon tries to download references that don't belong to any family. [#310](https://github.com/BU-ISCIII/buisciii-tools/pull/310) - Added mvmoneo to SFTP users. [#317](https://github.com/BU-ISCIII/buisciii-tools/pull/317) -- Added scripts for time series RNAseq and updated differential expression code for differentially expressed transcripts [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316) +- Added scripts for time series RNAseq and updated differential expression code for differentially expressed transcripts [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316). +- Added bbaladron to SFTP users [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316). 
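For orientation, a minimal invocation of the new time-series script might look
like this (values are illustrative, taken from the script's own defaults and the
--time_order help text rather than from any lablog in this series):

    Rscript time_series_differential_expression.R \
      --rnaseq_dir ../../01-rnaseq \
      --clinical_data ../clinical_data.txt \
      --group_col Group \
      --time_order 15D,45D,3M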
### Modules From fdf6271682aa04e9e6429c5aa5513cd0c4937120 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 19 Aug 2024 17:12:59 +0200 Subject: [PATCH 190/321] Added pikavirus configuration --- bu_isciii/templates/services.json | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index 3e57d041b..147277fe4 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -42,10 +42,10 @@ "url": "https://github.com/BU-ISCIII/PikaVirus", "description": "PikaVirus, a mapping-based tool for metagenome analysis of virus.", "clean": { - "folders":[], + "folders":["virus_coverage/plots"], "files":[] }, - "no_copy": ["RAW", "TMP"], + "no_copy": ["RAW", "TMP", "01-PikaVirus-results"], "last_folder":"REFERENCES", "delivery_md": "assets/reports/md/pikavirus.md", "results_md": "assets/reports/results/pikavirus.md" From 6c9da287452afaecbc98b1a8bc2f5b7455ff02b3 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 19 Aug 2024 17:29:50 +0200 Subject: [PATCH 191/321] Added plasmidID configuration --- bu_isciii/templates/services.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index 147277fe4..d60131998 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -60,7 +60,7 @@ "description": "Plasmid identification tool based on mapping and assisted by assembly", "clean": { "folders":["01-preprocessing/trimmed_sequences"], - "files":[] + "files":["mapping/sample_name.sorted.bam", "kmer/database.msh"] }, "no_copy": ["RAW", "TMP"], "delivery_md": "assets/reports/md/plasmidid.md", From 67f491bf8e67f1f1a6cf0180664e73a0243ecdc7 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 19 Aug 2024 17:32:11 +0200 Subject: [PATCH 192/321] Added wgmlst_chewbbaca configuration --- bu_isciii/templates/services.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index d60131998..7c8049fed 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -94,7 +94,7 @@ "description": "Multilocus sequence typing (MLST) using chewBBACA", "depends_on": "assembly_annotation", "clean": { - "folders":["03-assembly/trimming/trimmed", "01-preprocessing/{sample_name}"], + "folders":[], "files":[] }, "no_copy": ["RAW", "TMP"], From f6e8d05b88b2f3e59f4b2af87e37f0b3296e0915 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 19 Aug 2024 17:32:52 +0200 Subject: [PATCH 193/321] Added wgmlst_ctaranis configuration --- bu_isciii/templates/services.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index 7c8049fed..abb0a1a2d 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -76,7 +76,7 @@ "description": "Multilocus sequence typing (MLST) using Taranis", "depends_on": "assembly_annotation", "clean": { - "folders":["03-assembly/trimming/trimmed", "01-preprocessing"], + "folders":[], "files":[] }, "no_copy": ["RAW", "TMP"], From 616b08e0f12f5d812b360c70025aac78ea3f8865 Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 19 Aug 2024 17:38:48 +0200 Subject: [PATCH 194/321] Added characterization configuration --- bu_isciii/templates/services.json | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/services.json 
b/bu_isciii/templates/services.json index abb0a1a2d..346a98727 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -195,7 +195,7 @@ "end": "", "description": "", "clean": { - "folders":[], + "folders":["01-preprocessing"], "files":[] }, "no_copy": ["RAW", "TMP", "00-reads", "fasta_inputs"], From c39b700247e6a30a64945f76ee376d3f356bd69d Mon Sep 17 00:00:00 2001 From: "jaime.ozaez" Date: Mon, 19 Aug 2024 17:56:10 +0200 Subject: [PATCH 195/321] Updated CHANGELOG.md --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index cc58e59f7..42e236f2c 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -80,6 +80,7 @@ Code contributions to the new version: - Fixed autoclean-sftp function. [#281](https://github.com/BU-ISCIII/buisciii-tools/pull/281) - Fixed bioinfo_doc.py. Modified it so that this module creates a .pdf file including new-line characters, without merging lines into one single line [#259](https://github.com/BU-ISCIII/buisciii-tools/pull/259). - PR [#288](https://github.com/BU-ISCIII/buisciii-tools/pull/288) Fixed updating service's state to in_progress multiple times, related with issue [#285](https://github.com/BU-ISCIII/buisciii-tools/issues/285) +- Review and update of services.json for files and folders cleaning [#318](https://github.com/BU-ISCIII/buisciii-tools/pull/318). #### Changed From 3bb2d2270e57b09962cbb4b184d23b5deffafaaf Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 23 Aug 2024 16:13:03 +0200 Subject: [PATCH 196/321] added files of template characterization-taxprofiler --- .../ANALYSIS/ANALYSIS02_TAXPROFILING/lablog | 91 +++++++++++++++++++ .../ANALYSIS/lablog_taxprofiling | 6 ++ .../characterization/DOC/databasesheet.csv | 6 ++ .../DOC/hpc_slurm_taxprofiler.config | 35 +++++++ .../RESULTS/lablog_taxprofiling_results | 8 ++ 5 files changed, 146 insertions(+) create mode 100644 bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog create mode 100644 bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling create mode 100644 bu_isciii/templates/characterization/DOC/databasesheet.csv create mode 100644 bu_isciii/templates/characterization/DOC/hpc_slurm_taxprofiler.config create mode 100644 bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog new file mode 100644 index 000000000..817c77e88 --- /dev/null +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog @@ -0,0 +1,91 @@ +# SETUP INTPUT SAMPLE SHEET +ln -s ../00-reads . +ln -s ../samples_id.txt . + +# Function to print colored text +print_color() { + case "$2" in + "red") + echo -e "\e[1;31m$1\e[0m" + ;; + "green") + echo -e "\e[1;32m$1\e[0m" + ;; + "blue") + echo -e "\e[1;34m$1\e[0m" + ;; + *) + echo "$1" + ;; + esac +} + +# Function to prompt with color +prompt_with_color() { + read -p "$(print_color $1 'blue') $2" response +} + +# Select whether to save trimmed reads +trim_options=("Yes" "No") +print_color "Do you want to save trimmed reads in outdir?" 'blue' +select TRIMMED in "${trim_options[@]}"; do + if [ -n "$TRIMMED" ]; then + # rename trimmed + if [ "$TRIMMED" == "Yes" ] || [ "$TRIMMED" == "y" ]; then + SAVETRIMMED="true" + else + SAVETRIMMED="false" + fi + + break + else + print_color "Invalid input. Please select a valid option." 
'red' + fi +done +print_color "Selected trimmed file option: $TRIMMED save trimmed" 'green' + + +# Samples sheet setup +echo "sample,run_accession,instrument_platform,fastq_1,fastq_2,fasta" > samplesheet.csv +cat samples_id.txt | while read in; do + echo "${in},run1,ILLUMINA,00-reads/${in}_R1.fastq.gz,00-reads/${in}_R2.fastq.gz," +done >> samplesheet.csv + +scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") + +# slurm sbatch file setup +cat < taxprofiler.sbatch +#!/bin/sh +#SBATCH --ntasks 1 +#SBATCH --cpus-per-task 2 +#SBATCH --mem 4G +#SBATCH --time 2:00:00 +#SBATCH --partition middle_idx +#SBATCH --output $(date '+%Y%m%d')_taxprofiler.log +#SBATCH --chdir $scratch_dir + +# module load Nextflow/23.10.0 singularity +export NXF_OPTS="-Xms500M -Xmx10G" + +nextflow run /data/bi/pipelines/nf-core-taxprofiler/nf-core-taxprofiler-1.1.8 \\ + -profile singularity \\ + -c ../../DOC/hpc_slurm_taxprofiler.config \\ + --input samplesheet.csv \\ + --outdir ./ \\ + --databases ../../DOC/databasesheet.csv \\ + --preprocessing_qc_tool fastqc \\ + --save_preprocessed_reads ${SAVETRIMMED} \\ + --perform_shortread_qc true \\ + --shortread_qc_tool fastp \\ + --perform_shortread_hostremoval true \\ + --hostremoval_reference /data/bi/references/eukaria/homo_sapiens/hg38/NCBI/genome/GCF_000001405.40_GRCh38.p14/GCF_000001405.40_GRCh38.p14_genomic.fna.gz \\ + --run_kraken2 true \\ + --run_bracken true \\ + --run_centrifuge true \\ + --run_kaiju true \\ + --run_metaphlan true \\ + --run_krona true \\ + -resume +EOF + +echo "sbatch taxprofiler.sbatch" > _01_nf_taxprofiler.sh diff --git a/bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling b/bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling new file mode 100644 index 000000000..e4a813bf5 --- /dev/null +++ b/bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling @@ -0,0 +1,6 @@ +mkdir -p 00-reads + +cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd - +cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd - + +mv ANALYSIS02_TAXPROFILING $(date '+%Y%m%d')_ANALYSIS02_TAXPROFILING diff --git a/bu_isciii/templates/characterization/DOC/databasesheet.csv b/bu_isciii/templates/characterization/DOC/databasesheet.csv new file mode 100644 index 000000000..811e462c1 --- /dev/null +++ b/bu_isciii/templates/characterization/DOC/databasesheet.csv @@ -0,0 +1,6 @@ +tool,db_name,db_params,db_path +kraken2,db1,,/data/bi/references/kraken/minikraken_8GB_20200312.tgz +bracken,db2,,/data/bi/references/bracken/bracken_minikraken_8GB_20200312.tgz +centrifuge,db3,,/data/bi/references/centrifuge/201612_centrifuge_index_p+h+v.tar.gz +metaphlan,db4,,/data/bi/references/metaphlan/mpa_vJun23_CHOCOPhlAnSGB_20240/ +kaiju,db5,,/data/bi/references/kaiju/nr_euk_2023-05-10/ \ No newline at end of file diff --git a/bu_isciii/templates/characterization/DOC/hpc_slurm_taxprofiler.config b/bu_isciii/templates/characterization/DOC/hpc_slurm_taxprofiler.config new file mode 100644 index 000000000..bfbc4ac15 --- /dev/null +++ b/bu_isciii/templates/characterization/DOC/hpc_slurm_taxprofiler.config @@ -0,0 +1,35 @@ +/* + HPC XTUTATIS CONFIGURATION +*/ + +singularity { + enabled = true + autoMounts = true + singularity.cacheDir = '/data/cnm/ratb/pipelines/singularity-images/' +} + +process { + executor = 'slurm' + queue = 'middle_idx' + jobName = { "$task.name - $task.hash" } + conda = null + + errorStrategy = { task.exitStatus in 
((130..145) + 104) ? 'retry' : 'finish' } + + withName:'KAIJU_KAIJU' { + errorStrategy = { task.exitStatus in [143,137,21,1] ? 'retry' : 'finish' } + maxRetries = 3 + memory = { 72.GB * task.attempt } + time = { 8.h } + } +} + +params { + max_memory = 376.GB + max_cpus = 32 + max_time = '24.h' +} + +/* + Custom base.config +*/ diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results b/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results new file mode 100644 index 000000000..f980497de --- /dev/null +++ b/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results @@ -0,0 +1,8 @@ +DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega01" +mkdir -p $DELIVERY_FOLDER/taxprofiling + +# Taxprofiling service +cd $DELIVERY_FOLDER/taxprofiling + +# Links to reports +ln -s ../../../ANALYSIS/*ANALYSIS02_TAXPROFILING/results/multiqc/multiqc_report.html . \ No newline at end of file From f74e4848db9c91e704c15d6a36f4e243343a3263 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 23 Aug 2024 16:24:26 +0200 Subject: [PATCH 197/321] fixed file end lines --- bu_isciii/templates/characterization/DOC/databasesheet.csv | 2 +- .../characterization/RESULTS/lablog_taxprofiling_results | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/characterization/DOC/databasesheet.csv b/bu_isciii/templates/characterization/DOC/databasesheet.csv index 811e462c1..a227b08c7 100644 --- a/bu_isciii/templates/characterization/DOC/databasesheet.csv +++ b/bu_isciii/templates/characterization/DOC/databasesheet.csv @@ -3,4 +3,4 @@ kraken2,db1,,/data/bi/references/kraken/minikraken_8GB_20200312.tgz bracken,db2,,/data/bi/references/bracken/bracken_minikraken_8GB_20200312.tgz centrifuge,db3,,/data/bi/references/centrifuge/201612_centrifuge_index_p+h+v.tar.gz metaphlan,db4,,/data/bi/references/metaphlan/mpa_vJun23_CHOCOPhlAnSGB_20240/ -kaiju,db5,,/data/bi/references/kaiju/nr_euk_2023-05-10/ \ No newline at end of file +kaiju,db5,,/data/bi/references/kaiju/nr_euk_2023-05-10/ diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results b/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results index f980497de..7d5cce5cf 100644 --- a/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results +++ b/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results @@ -5,4 +5,4 @@ mkdir -p $DELIVERY_FOLDER/taxprofiling cd $DELIVERY_FOLDER/taxprofiling # Links to reports -ln -s ../../../ANALYSIS/*ANALYSIS02_TAXPROFILING/results/multiqc/multiqc_report.html . \ No newline at end of file +ln -s ../../../ANALYSIS/*ANALYSIS02_TAXPROFILING/results/multiqc/multiqc_report.html . From d61a555cecf36b22feaa3659b593a77a85d2a5a1 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 23 Aug 2024 16:38:03 +0200 Subject: [PATCH 198/321] update changelog #320 --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 42e236f2c..42f918ab2 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -64,6 +64,7 @@ Code contributions to the new version: - Added mvmoneo to SFTP users. [#317](https://github.com/BU-ISCIII/buisciii-tools/pull/317) - Added scripts for time series RNAseq and updated differential expression code for differentially expressed transcripts [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316). - Added bbaladron to SFTP users [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316). 
+- Added new template for comprehensive taxonomy profiling using the nf-core/taxprofiler pipeline [#320](https://github.com/BU-ISCIII/buisciii-tools/pull/320). ### Modules From f0a183ee42cd2f7482d6192efba93b63fdee5934 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 09:45:47 +0200 Subject: [PATCH 199/321] uppdate execution time and database paths --- .../characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog | 2 +- bu_isciii/templates/characterization/DOC/databasesheet.csv | 4 ++-- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog index 817c77e88..e16eab703 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog +++ b/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog @@ -59,7 +59,7 @@ cat < taxprofiler.sbatch #SBATCH --ntasks 1 #SBATCH --cpus-per-task 2 #SBATCH --mem 4G -#SBATCH --time 2:00:00 +#SBATCH --time 24:00:00 #SBATCH --partition middle_idx #SBATCH --output $(date '+%Y%m%d')_taxprofiler.log #SBATCH --chdir $scratch_dir diff --git a/bu_isciii/templates/characterization/DOC/databasesheet.csv b/bu_isciii/templates/characterization/DOC/databasesheet.csv index a227b08c7..18b4afee6 100644 --- a/bu_isciii/templates/characterization/DOC/databasesheet.csv +++ b/bu_isciii/templates/characterization/DOC/databasesheet.csv @@ -1,6 +1,6 @@ tool,db_name,db_params,db_path -kraken2,db1,,/data/bi/references/kraken/minikraken_8GB_20200312.tgz -bracken,db2,,/data/bi/references/bracken/bracken_minikraken_8GB_20200312.tgz +kraken2,db1,,/data/bi/references/kraken/k2_standard_16gb_20240605.tar.gz +bracken,db2,,/data/bi/references/kraken/k2_standard_16gb_20240605.tar.gz centrifuge,db3,,/data/bi/references/centrifuge/201612_centrifuge_index_p+h+v.tar.gz metaphlan,db4,,/data/bi/references/metaphlan/mpa_vJun23_CHOCOPhlAnSGB_20240/ kaiju,db5,,/data/bi/references/kaiju/nr_euk_2023-05-10/ From 180447ba23800402a6c7210c05b96d8134907541 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 10:14:32 +0200 Subject: [PATCH 200/321] relocated template taxprofiler --- .../characterization/RESULTS/lablog_taxprofiling_results | 8 -------- .../ANALYSIS/ANALYSIS01_TAXPROFILER}/lablog | 4 ++-- .../ANALYSIS/lablog_taxprofiler} | 2 +- .../{characterization => mag}/DOC/databasesheet.csv | 0 .../DOC/taxprofiler.config} | 0 .../templates/mag/RESULTS/lablog_taxprofiler_results | 8 ++++++++ 6 files changed, 11 insertions(+), 11 deletions(-) delete mode 100644 bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results rename bu_isciii/templates/{characterization/ANALYSIS/ANALYSIS02_TAXPROFILING => mag/ANALYSIS/ANALYSIS01_TAXPROFILER}/lablog (96%) rename bu_isciii/templates/{characterization/ANALYSIS/lablog_taxprofiling => mag/ANALYSIS/lablog_taxprofiler} (78%) rename bu_isciii/templates/{characterization => mag}/DOC/databasesheet.csv (100%) rename bu_isciii/templates/{characterization/DOC/hpc_slurm_taxprofiler.config => mag/DOC/taxprofiler.config} (100%) create mode 100755 bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results diff --git a/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results b/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results deleted file mode 100644 index 7d5cce5cf..000000000 --- a/bu_isciii/templates/characterization/RESULTS/lablog_taxprofiling_results +++ /dev/null @@ -1,8 +0,0 @@ -DELIVERY_FOLDER="$(date 
'+%Y%m%d')_entrega01" -mkdir -p $DELIVERY_FOLDER/taxprofiling - -# Taxprofiling service -cd $DELIVERY_FOLDER/taxprofiling - -# Links to reports -ln -s ../../../ANALYSIS/*ANALYSIS02_TAXPROFILING/results/multiqc/multiqc_report.html . diff --git a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_TAXPROFILER/lablog similarity index 96% rename from bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog rename to bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_TAXPROFILER/lablog index e16eab703..06bd2f6bf 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/ANALYSIS02_TAXPROFILING/lablog +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_TAXPROFILER/lablog @@ -65,11 +65,11 @@ cat < taxprofiler.sbatch #SBATCH --chdir $scratch_dir # module load Nextflow/23.10.0 singularity -export NXF_OPTS="-Xms500M -Xmx10G" +export NXF_OPTS="-Xms500M -Xmx6G" nextflow run /data/bi/pipelines/nf-core-taxprofiler/nf-core-taxprofiler-1.1.8 \\ -profile singularity \\ - -c ../../DOC/hpc_slurm_taxprofiler.config \\ + -c ../../DOC/taxprofiler.config \\ --input samplesheet.csv \\ --outdir ./ \\ --databases ../../DOC/databasesheet.csv \\ diff --git a/bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling b/bu_isciii/templates/mag/ANALYSIS/lablog_taxprofiler similarity index 78% rename from bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling rename to bu_isciii/templates/mag/ANALYSIS/lablog_taxprofiler index e4a813bf5..f6a3f119b 100644 --- a/bu_isciii/templates/characterization/ANALYSIS/lablog_taxprofiling +++ b/bu_isciii/templates/mag/ANALYSIS/lablog_taxprofiler @@ -3,4 +3,4 @@ mkdir -p 00-reads cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd - cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd - -mv ANALYSIS02_TAXPROFILING $(date '+%Y%m%d')_ANALYSIS02_TAXPROFILING +mv ANALYSIS01_TAXPROFILER $(date '+%Y%m%d')_ANALYSIS01_TAXPROFILER diff --git a/bu_isciii/templates/characterization/DOC/databasesheet.csv b/bu_isciii/templates/mag/DOC/databasesheet.csv similarity index 100% rename from bu_isciii/templates/characterization/DOC/databasesheet.csv rename to bu_isciii/templates/mag/DOC/databasesheet.csv diff --git a/bu_isciii/templates/characterization/DOC/hpc_slurm_taxprofiler.config b/bu_isciii/templates/mag/DOC/taxprofiler.config similarity index 100% rename from bu_isciii/templates/characterization/DOC/hpc_slurm_taxprofiler.config rename to bu_isciii/templates/mag/DOC/taxprofiler.config diff --git a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results new file mode 100755 index 000000000..d6231a54b --- /dev/null +++ b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results @@ -0,0 +1,8 @@ +DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega01" +mkdir -p $DELIVERY_FOLDER/taxprofiler + +# Taxprofiling service +cd $DELIVERY_FOLDER/taxprofiler + +# Links to reports +ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/results/multiqc/multiqc_report.html . 
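+
+# Editor's note (hypothetical addition, not part of the original template): before
+# delivery it can be worth checking that none of the links created above are
+# dangling, e.g. with:
+#   find . -xtype l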
From 9ccbdcba28ab452c3d66686eb348415a037a97d1 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 11:33:02 +0200 Subject: [PATCH 201/321] udpdate documentation of template taxprofiler --- README.md | 7 +- bu_isciii/assets/reports/md/mag.md | 687 +++++++++++++++++++++++- bu_isciii/assets/reports/results/mag.md | 9 + bu_isciii/templates/services.json | 4 +- 4 files changed, 701 insertions(+), 6 deletions(-) diff --git a/README.md b/README.md index 138380a1a..fa4f2e68f 100644 --- a/README.md +++ b/README.md @@ -148,9 +148,10 @@ Output: │ │ control, host removal and exploratory │ │ │ │ analysis of samples. │ │ │ ariba_characterization │ │ │ -│ mag_met │ Bioinformatics best-practise analysis │ https://github.com/nf-core/mag │ -│ │ pipeline for assembly, binning and │ │ -│ │ annotation of metagenomes. │ │ +│ mag_met │ 1- Bioinformatics best-practise analysis │ https://github.com/nf-core/mag or │ +│ │ for taxonomic classification and │ https://github.com/nf-core/taxprofiler │ +│ │ profiling; 2- Bioinformatics best-practise│ │ +│ │ analysis pipeline for assembly, binning │ │ └────────────────────────┴───────────────────────────────────────────┴────────────────────────────────────────────┘ ``` diff --git a/bu_isciii/assets/reports/md/mag.md b/bu_isciii/assets/reports/md/mag.md index 1b216b9ea..67ef902a2 100644 --- a/bu_isciii/assets/reports/md/mag.md +++ b/bu_isciii/assets/reports/md/mag.md @@ -749,4 +749,689 @@ Summary tool-specific plots and tables of following tools are currently displaye -[Nextflow](https://www.nextflow.io/docs/latest/tracing.html) provides excellent functionality for generating various reports relevant to the running and execution of the pipeline. This will allow you to troubleshoot errors with the running of the pipeline, and also provide you with other information such as launch commands, run times and resource usage. \ No newline at end of file +[Nextflow](https://www.nextflow.io/docs/latest/tracing.html) provides excellent functionality for generating various reports relevant to the running and execution of the pipeline. This will allow you to troubleshoot errors with the running of the pipeline, and also provide you with other information such as launch commands, run times and resource usage. + +# nf-core/taxprofiler: Output + +## Introduction + +This document describes the output produced by the pipeline. Most of the plots are taken from the MultiQC report, which summarises results at the end of the pipeline. + +The directories listed below will be created in the results directory after the pipeline has finished. All paths are relative to the top-level results directory. 
+
+## Pipeline overview
+
+The pipeline is built using [Nextflow](https://www.nextflow.io/) and processes data using the following steps:
+
+- [UNTAR](#untar) - Optionally saved decompressed input databases
+- [FastQC](#fastqc) - Raw read QC
+- [falco](#fastqc) - Alternative to FastQC for raw read QC
+- [fastp](#fastp) - Adapter trimming for Illumina data
+- [AdapterRemoval](#adapterremoval) - Adapter trimming for Illumina data
+- [Porechop](#porechop) - Adapter removal for Oxford Nanopore data
+- [BBDuk](#bbduk) - Quality trimming and filtering for Illumina data
+- [PRINSEQ++](#prinseq) - Quality trimming and filtering for Illumina data
+- [Filtlong](#filtlong) - Quality trimming and filtering for Nanopore data
+- [Bowtie2](#bowtie2) - Host removal for Illumina reads
+- [minimap2](#minimap2) - Host removal for Nanopore reads
+- [SAMtools stats](#samtools-stats) - Statistics from host removal
+- [SAMtools fastq](#samtools-fastq) - Converts unmapped BAM file to fastq format (minimap2 only)
+- [Analysis Ready Reads](#analysis-ready-reads) - Optional results directory containing the final processed reads used as input for classification/profiling.
+- [Bracken](#bracken) - Taxonomic classifier using k-mers and abundance estimations
+- [Kraken2](#kraken2) - Taxonomic classifier using exact k-mer matches
+- [KrakenUniq](#krakenuniq) - Taxonomic classifier that combines the k-mer-based classification and the number of unique k-mers found in each species
+- [Centrifuge](#centrifuge) - Taxonomic classifier that uses a novel indexing scheme based on the Burrows-Wheeler transform (BWT) and the Ferragina-Manzini (FM) index.
+- [Kaiju](#kaiju) - Taxonomic classifier that finds maximum (in-)exact matches on the protein-level.
+- [Diamond](#diamond) - Sequence aligner for protein and translated DNA searches.
+- [MALT](#malt) - Sequence alignment and analysis tool designed for processing high-throughput sequencing data, especially in the context of metagenomics
+- [MetaPhlAn](#metaphlan) - Genome-level marker gene based taxonomic classifier
+- [mOTUs](#motus) - Tool for marker gene-based OTU (mOTU) profiling.
+- [KMCP](#kmcp) - Taxonomic classifier that utilizes genome coverage information by splitting the reference genomes into chunks and stores k-mers in a modified and optimized COBS index for fast alignment-free sequence searching.
+- [ganon](#ganon) - Taxonomic classifier and profiler that uses Interleaved Bloom Filters as indices based on k-mers/minimizers.
+- [TAXPASTA](#taxpasta) - Tool to standardise taxonomic profiles as well as merge profiles across samples from the same database and classifier/profiler.
+- [MultiQC](#multiqc) - Aggregate report describing results and QC from the whole pipeline
+- [Pipeline information](#pipeline-information) - Report metrics generated during the workflow execution
+
+![](images/taxprofiler_tube.png)
+
+### untar
+
+untar is used in nf-core/taxprofiler to decompress various input files ending in `.tar.gz`. This process is mainly used for decompressing input database archive files.
+
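+As a hedged illustration of the caching idea described here (directory and archive names are placeholders, not pipeline defaults), a database archive can be decompressed once into a shared location and re-used on later runs:
+
+```bash
+# Decompress a database archive once into a central cache (example paths)
+mkdir -p /data/databases/cache/kraken2_db
+tar -xzf kraken2_db.tar.gz -C /data/databases/cache/kraken2_db
+# Later runs can point the database sheet at the decompressed directory
+# instead of the .tar.gz archive, skipping the untar step entirely.
+```
+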
+Output files + +- `untar/` + - `database/` + - ``: directory containing contents of the decompressed archive + +
+
+This directory will only be present if `--save_untarred_databases` is supplied. The contained directories can be useful for moving the decompressed directories to a central 'cache' location, allowing users to re-use the same databases. This avoids spending unnecessary computational time on decompressing the archives on every run.
+
+### FastQC or Falco
+
+Output files + +- `{fastqc,falco}/` + - {raw,preprocessed} + - `*html`: FastQC or Falco report containing quality metrics in HTML format. + - `*.txt`: FastQC or Falco report containing quality metrics in TXT format. + - `*.zip`: Zip archive containing the FastQC report, tab-delimited data file and plot images (FastQC only). + +
+
+[FastQC](http://www.bioinformatics.babraham.ac.uk/projects/fastqc/) gives general quality metrics about your sequenced reads. It provides information about the quality score distribution across your reads, per base sequence content (%A/T/G/C), adapter contamination and overrepresented sequences. For further reading and documentation see the [FastQC help pages](http://www.bioinformatics.babraham.ac.uk/projects/fastqc/Help/).
+
+If preprocessing is turned on, nf-core/taxprofiler runs FastQC/Falco twice - once before and once after adapter removal/read merging - to allow evaluation of the performance of these preprocessing steps. Note in the General Stats table, the columns of these two instances of FastQC/Falco are placed next to each other to make it easier to evaluate. However, the columns of the actual preprocessing steps (i.e., fastp, AdapterRemoval, and Porechop) will be displayed _after_ the two FastQC/Falco columns, even if they were run 'between' the two FastQC/Falco jobs in the pipeline itself.
+
+:::info
+Falco produces identical output to FastQC but in the `falco/` directory.
+:::
+
+![MultiQC - FastQC sequence counts plot](images/mqc_fastqc_counts.png)
+
+![MultiQC - FastQC mean quality scores plot](images/mqc_fastqc_quality.png)
+
+![MultiQC - FastQC adapter content plot](images/mqc_fastqc_adapter.png)
+
+:::note
+The FastQC plots displayed in the MultiQC report show _untrimmed_ reads. They may contain adapter sequence and potentially regions with low quality.
+:::
+
+### fastp
+
+[fastp](https://github.com/OpenGene/fastp) is a FASTQ pre-processing tool for quality control, trimming of adapters, quality filtering and other features.
+
+It is used in nf-core/taxprofiler for adapter trimming of short-reads.
+
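+For orientation only - the pipeline assembles the exact fastp command internally - a roughly equivalent standalone invocation for paired-end adapter trimming might look like this (file names are placeholders):
+
+```bash
+fastp \
+    --in1 sample_R1.fastq.gz --in2 sample_R2.fastq.gz \
+    --out1 sample_trimmed_R1.fastq.gz --out2 sample_trimmed_R2.fastq.gz \
+    --json sample.fastp.json --html sample.fastp.html \
+    --thread 4
+```
+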
+Output files + +- `fastp/` + - `.fastp.fastq.gz`: File with the trimmed unmerged fastq reads. + - `.merged.fastq.gz`: File with the reads that were successfully merged. + - `.*{log,html,json}`: Log files in different formats. + +
+ +By default nf-core/taxprofiler will only provide the `.fastp.fastq.gz` file if fastp is selected. The file `.merged.fastq.gz` will be available in the output folder if you provide the argument ` --shortread_qc_mergepairs` (optionally retaining un-merged pairs when in combination with `--shortread_qc_includeunmerged`). + +You can change the default value for low complexity filtering by using the argument `--shortread_complexityfilter_fastp_threshold`. + +### AdapterRemoval + +[AdapterRemoval](https://adapterremoval.readthedocs.io/en/stable/) searches for and removes remnant adapter sequences from High-Throughput Sequencing (HTS) data and (optionally) trims low quality bases from the 3' end of reads following adapter removal. It is popular in the field of palaeogenomics. The output logs are stored in the results folder, and as a part of the MultiQC report. + +
+Output files
+
+- `adapterremoval/`
+  - `.settings`: AdapterRemoval log file containing general adapter removal, read trimming and merging statistics
+  - `.collapsed.fastq.gz` - read-pairs that merged and did not undergo trimming (only when `--shortread_qc_mergepairs` supplied)
+  - `.collapsed.truncated.fastq.gz` - read-pairs that merged and underwent quality trimming (only when `--shortread_qc_mergepairs` supplied)
+  - `.pair1.truncated.fastq.gz` - read 1 of pairs that underwent quality trimming
+  - `.pair2.truncated.fastq.gz` - read 2 of pairs that underwent quality trimming (and could not merge if `--shortread_qc_mergepairs` supplied)
+  - `.singleton.truncated.fastq.gz` - orphaned read pairs where one of the pair was discarded
+  - `.discard.fastq.gz` - reads that were discarded due to length or quality filtering
+
+
+By default nf-core/taxprofiler will only provide the `.settings` file if AdapterRemoval is selected.
+
+You will only find the `.fastq` files in the results directory if you provide ` --save_preprocessed_reads`. If this is selected, you may receive different combinations of `.fastq` files for each sample depending on the input types - e.g. whether you have merged or not, or if you're supplying both single- and paired-end reads. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`.
+
+:::warning
+The resulting `.fastq` files may _not_ always be the 'final' reads that go into taxprofiling, if you also run other steps such as complexity filtering, host removal, run merging etc..
+:::
+
+### Porechop
+
+[Porechop](https://github.com/rrwick/Porechop) is a tool for finding and removing adapters from Oxford Nanopore reads. Adapters on the ends of reads are trimmed, and if a read has an adapter in its middle, it is considered chimeric and is chopped into separate reads.
+
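+As a sketch of what this step does (the pipeline wires up the call itself; file names here are placeholders):
+
+```bash
+# Trim ONT adapters from reads, splitting reads with internal adapters
+porechop -i sample_ont.fastq.gz -o sample_ont_trimmed.fastq.gz --threads 4
+```
+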
+Output files + +- `porechop/` + - `.log`: Log file containing trimming statistics + - `.fastq.gz`: Adapter-trimmed file + +
+
+The output logs are saved in the output folder and are part of the MultiQC report. You do not normally need to check these manually.
+
+You will only find the `.fastq` files in the results directory if you provide ` --save_preprocessed_reads`. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`.
+
+:::warning
+We do **not** recommend using Porechop if you are already trimming the adapters with ONT's basecaller Guppy.
+:::
+
+### BBDuk
+
+[BBDuk](https://jgi.doe.gov/data-and-tools/software-tools/bbtools/bb-tools-user-guide/bbduk-guide/) stands for Decontamination Using Kmers. BBDuk was developed to combine most common data-quality-related trimming, filtering, and masking operations into a single high-performance tool.
+
+It is used in nf-core/taxprofiler for complexity filtering using different algorithms. This means that it will remove reads with low sequence diversity (e.g. mono- or dinucleotide repeats).
+
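+Purely as an illustration of entropy-based complexity filtering (the threshold and file names below are example values, not necessarily the pipeline's defaults):
+
+```bash
+# Discard reads whose sequence entropy falls below 0.3
+bbduk.sh in=sample_R1.fastq.gz in2=sample_R2.fastq.gz \
+    out=sample_filtered_R1.fastq.gz out2=sample_filtered_R2.fastq.gz \
+    entropy=0.3
+```
+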
+Output files + +- `bbduk/` + - `.bbduk.log`: log file containing filtering statistics + - `.fastq.gz`: resulting FASTQ file without low-complexity reads + +
+ +By default nf-core/taxprofiler will only provide the `.log` file if BBDuk is selected as the complexity filtering tool. You will only find the complexity filtered reads in your results directory if you provide ` --save_complexityfiltered_reads`. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`. + +:::warning +The resulting `.fastq` files may _not_ always be the 'final' reads that go into taxprofiling, if you also run other steps such as host removal, run merging etc.. +::: + +### PRINSEQ++ + +[PRINSEQ++](https://github.com/Adrian-Cantu/PRINSEQ-plus-plus) is a C++ implementation of the [prinseq-lite.pl](https://prinseq.sourceforge.net/) program. It can be used to filter, reformat or trim genomic and metagenomic sequence data. + +It is used in nf-core/taxprofiler for complexity filtering using different algorithms. This means that it will remove reads with low sequence diversity (e.g. mono- or dinucleotide repeats). + +
+Output files + +- `prinseqplusplus/` + - `.log`: log file containing number of reads. Row IDs correspond to: `min_len, max_len, min_gc, max_gc, min_qual_score, min_qual_mean, ns_max_n, noiupac, derep, lc_entropy, lc_dust, trim_tail_left, trim_tail_right, trim_qual_left, trim_qual_right, trim_left, trim_right` + - `_good_out.fastq.gz`: resulting FASTQ file without low-complexity reads + +
+
+By default nf-core/taxprofiler will only provide the `.log` file if PRINSEQ++ is selected as the complexity filtering tool. You will only find the complexity-filtered `.fastq` files in your results directory if you supply ` --save_complexityfiltered_reads`. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`.
+
+:::warning
+The resulting `.fastq` files may _not_ always be the 'final' reads that go into taxprofiling, if you also run other steps such as host removal, run merging etc..
+:::
+
+### Filtlong
+
+[Filtlong](https://github.com/rrwick/Filtlong) is a quality filtering tool for long reads. It can take a set of long reads and produce a smaller, better subset.
+
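+A minimal sketch of a standalone Filtlong call (thresholds and file names are example values only):
+
+```bash
+# Keep the best 90% of bases and drop reads shorter than 1 kb
+filtlong --min_length 1000 --keep_percent 90 sample_ont.fastq.gz \
+    | gzip > sample_ont_filtered.fastq.gz
+```
+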
+Output files + +- `filtlong/` + - `_filtered.fastq.gz`: Quality or short read data filtered file + - `_filtered.log`: log file containing summary statistics + +
+ +You will only find the `.fastq` files in the results directory if you provide ` --save_preprocessed_reads`. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`. + +:::warning +We do _not_ recommend using Filtlong if you are performing filtering of low quality reads with ONT's basecaller Guppy. +::: + +### Bowtie2 + +[Bowtie 2](https://bowtie-bio.sourceforge.net/bowtie2/index.shtml) is an ultrafast and memory-efficient tool for aligning sequencing reads to long reference sequences. It is particularly good at aligning reads of about 50 up to 100s or 1,000s of characters, and particularly good at aligning to relatively long (e.g. mammalian) genomes. + +It is used with nf-core/taxprofiler to allow removal of 'host' (e.g. human) and/or other possible contaminant reads (e.g. Phi X) from short-read `.fastq` files prior to profiling. + +
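+To make the host-removal idea concrete - this is a hedged sketch, not the pipeline's internal command; the index prefix and file names are placeholders:
+
+```bash
+# Align against a pre-built host index and keep only read pairs that do NOT
+# map (bowtie2 replaces % in the --un-conc filename with the mate number)
+bowtie2 -x GRCh38_index \
+    -1 sample_R1.fastq.gz -2 sample_R2.fastq.gz \
+    --un-conc-gz sample_unmapped_R%.fastq.gz \
+    -S /dev/null
+```
+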
+Output files
+
+- `bowtie2/`
+  - `build/`
+    - `*.bt2`: Bowtie2 indices of reference genome, only if `--save_hostremoval_index` supplied.
+  - `align/`
+    - `.bam`: BAM file containing reads that aligned against the user-supplied reference genome as well as unmapped reads
+    - `.bowtie2.log`: log file about the mapped reads
+    - `.unmapped.fastq.gz`: the off-target reads from the mapping that are used in downstream steps.
+
+ +By default nf-core/taxprofiler will only provide the `.log` file if host removal is turned on. You will only have a `.bam` file if you specify `--save_hostremoval_bam`. This will contain _both_ mapped and unmapped reads. You will only get FASTQ files if you specify to save `--save_hostremoval_unmapped` - these contain only unmapped reads. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`. + +:::info +Unmapped reads in FASTQ are only found in this directory for short-reads, for long-reads see [`samtools/fastq/`](#samtools-fastq). +::: + +:::info +The resulting `.fastq` files may _not_ always be the 'final' reads that go into taxprofiling, if you also run other steps such as run merging etc.. +::: + +:::info +While there is a dedicated section in the MultiQC HTML for Bowtie2, these values are not displayed by default in the General Stats table. Rather, alignment statistics to host genome is reported via samtools stats module in MultiQC report for direct comparison with minimap2 (see below). +::: + +### minimap2 + +[minimap2](https://github.com/lh3/minimap2) is an alignment tool suited to mapping long reads to reference sequences. + +It is used with nf-core/taxprofiler to allow removal of 'host' (e.g. human) or other possible contaminant reads from long-read `.fastq` files prior to taxonomic classification/profiling. + +
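+For long reads, the equivalent host-removal logic can be sketched as follows (reference and file names are placeholders; the pipeline performs these steps via its own minimap2 and SAMtools modules):
+
+```bash
+# Map ONT reads to the host genome, keep only unmapped reads (SAM flag 4),
+# and convert them back to FASTQ
+minimap2 -ax map-ont host_genome.fna reads_ont.fastq.gz \
+    | samtools view -bh -f 4 - \
+    | samtools fastq - \
+    | gzip > reads_ont_hostremoved.fastq.gz
+```
+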
+Output files + +- `minimap2/` + - `build/` + - `*.mmi2`: minimap2 indices of reference genome, only if `--save_hostremoval_index` supplied. + - `align/` + - `.bam`: Alignment file in BAM format containing both mapped and unmapped reads. + +
+ +By default, nf-core/taxprofiler will only provide the `.bam` file containing mapped and unmapped reads if saving of host removal for long reads is turned on via `--save_hostremoval_bam`. + +:::info +minimap2 is not yet supported as a module in MultiQC and therefore there is no dedicated section in the MultiQC HTML. Rather, alignment statistics to host genome is reported via samtools stats module in MultiQC report. +::: + +:::info +Unlike Bowtie2, minimap2 does not produce an unmapped FASTQ file by itself. See [`samtools/fastq`](#samtools-fastq). +::: + +### SAMtools fastq + +[SAMtools fastq](http://www.htslib.org/doc/1.1/samtools.html) converts a `.sam`, `.bam`, or `.cram` alignment file to FASTQ format + +
+Output files + +- `samtools/stats/` + - `_interleaved.fq.gz`: Unmapped reads only in FASTQ gzip format + +
+ +This directory will be present and contain the unmapped reads from the `.fastq` format from long-read minimap2 host removal, if `--save_hostremoval_unmapped` is supplied. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`. + +:::info +For short-read unmapped reads, see [bowtie2](#bowtie2). +::: + +### Analysis Ready Reads + +:::info +This optional results directory will only be present in the pipeline results when supplying `--save_analysis_ready_reads`. +::: + +
+Output files + +- `samtools/stats/` + - `_{fq,fastq}.gz`: Final reads that underwent preprocessing and were sent for classification/profiling. + +
+ +The results directory will contain the 'final' processed reads used as input for classification/profiling. It will _only_ include the output of the _last_ step of any combinations of preprocessing steps that may have been specified in the run configuration. For example, if you perform the read QC and host-removal preprocessing steps, the final reads that are sent to classification/profiling are the host-removed FASTQ files - those will be the ones present in this directory. + +:::warning +If you turn off all preprocessing steps, then no results will be present in this directory. This happens independently for short- and long-reads. I.e. you will only have FASTQ files for short reads in this directory if you skip all long-read preprocessing. +::: + +### SAMtools stats + +[SAMtools stats](http://www.htslib.org/doc/samtools-stats.html) collects statistics from a `.sam`, `.bam`, or `.cram` alignment file and outputs in a text format. + +
+Output files + +- `samtools/stats/` + - `.stats`: File containing samtools stats output. + +
+ +In most cases you do not need to check this file, as it is rendered in the MultiQC run report. + +### Run Merging + +nf-core/taxprofiler offers the option to merge FASTQ files of multiple sequencing runs or libraries that derive from the same sample, as specified in the input samplesheet. + +This is the last possible preprocessing step, so if you have multiple runs or libraries (and run merging turned on), this will represent the final reads that will go into classification/profiling steps. + +
+Output files + +- `run_merging/` + - `*.fastq.gz`: Concatenated FASTQ files on a per-sample basis + +
+
+Note that you will only find samples that went through the run merging step in this directory. Samples with only a single run or library will not go through this step of the pipeline and thus will not be present in this directory.
+
+This directory and its FASTQ files will only be present if you supply `--save_runmerged_reads`. Alternatively, if you wish only to have the 'final' reads that go into classification/profiling (i.e., that may have additional processing), do not specify this flag but rather specify `--save_analysis_ready_reads`, in which case the reads will be in the folder `analysis_ready_reads`.
+
+### Bracken
+
+[Bracken](https://ccb.jhu.edu/software/bracken/) (Bayesian Reestimation of Abundance with Kraken) is a highly accurate statistical method that computes the abundance of species in DNA sequences from a metagenomics sample. Bracken uses the taxonomy labels assigned by Kraken, a highly accurate metagenomics classification algorithm, to estimate the number of reads originating from each species present in a sample.
+
+:::info
+The first step of using Bracken requires running Kraken2, therefore the initial results before abundance estimation will be found in `/kraken2/`.
+:::
+
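+As a hedged standalone sketch of the re-estimation step (database path, read length and file names are placeholders):
+
+```bash
+# Re-estimate species-level (-l S) abundances from an existing Kraken2 report
+bracken -d /path/to/kraken2_db \
+    -i sample.kraken2.report.txt \
+    -o sample.bracken.tsv \
+    -r 150 -l S
+```
+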
+Output files + +- `bracken/` + - `/` + - `bracken__combined_reports.txt`: combined bracken results as output from Bracken's `combine_bracken_outputs.py` script + - `/` + - `_.tsv`: TSV file containing per-sample summary of Bracken results with abundance information + - `_.report_bracken_species.txt`: Kraken2 style report with Bracken abundance information + +
+
+The main taxonomic profiling file from Bracken is the `*.tsv` file. This provides the basic results from Kraken2 but with the corrected abundance information. Note that the raw Kraken2 version of the upstream step of Bracken can be found in the `kraken2/` directory with the suffix of `_.bracken.report.txt` (with a 6 column variant when `--save_minimizers` specified).
+
+### Kraken2
+
+[Kraken](https://ccb.jhu.edu/software/kraken2/) is a taxonomic sequence classifier that assigns taxonomic labels to DNA sequences. Kraken examines the k-mers within a query sequence and uses the information within those k-mers to query a database. That database maps k-mers to the lowest common ancestor (LCA) of all genomes known to contain a given k-mer.
+
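+A minimal standalone sketch of this classification step, assuming a local Kraken2 database (paths and file names are placeholders; the pipeline builds its own command):
+
+```bash
+# Classify a gzipped paired-end sample against a Kraken2 database
+kraken2 --db /path/to/kraken2_db --threads 8 \
+    --paired --gzip-compressed \
+    --report sample.kraken2.report.txt \
+    --output sample.kraken2.classifiedreads.txt \
+    sample_R1.fastq.gz sample_R2.fastq.gz
+```
+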
+Output files + +- `kraken2/` + - `_combined_reports.txt`: A combined profile of all samples aligned to a given database (as generated by `krakentools`) + - If you have also run Bracken, the original Kraken report (i.e., _before_ read re-assignment) will also be included in this directory with `-bracken` suffixed to your Bracken database name if you supply `--bracken_save_intermediatekraken2` to the run. For example: `kraken2--bracken.tsv`. However in most cases you want to use the actual Bracken file (i.e., `bracken_.tsv`). + - `/` + - `_.classified.fastq.gz`: FASTQ file containing all reads that had a hit against a reference in the database for a given sample + - `_.unclassified.fastq.gz`: FASTQ file containing all reads that did not have a hit in the database for a given sample + - `_.report.txt`: A Kraken2 report that summarises the fraction abundance, taxonomic ID, number of Kmers, taxonomic path of all the hits in the Kraken2 run for a given sample. Will be 6 column rather than 8 if `--save_minimizers` specified. This report will **only** be included if you supply `--bracken_save_intermediatekraken2` to the run. + - `_.classifiedreads.txt`: A list of read IDs and the hits each read had against each database for a given sample + +
+
+The main taxonomic classification file from Kraken2 is the `_combined_reports.txt` or `*report.txt` file. The former provides you with the broadest overview of the taxonomic classification results across all samples against a single database, where you get two columns for each sample e.g. `2_all` and `2_lvl`, as well as a summarised column summing up across all samples `tot_all` and `tot_lvl`. The latter gives you the most information for a single sample. The report file is also used for the taxpasta step.
+
+You will only receive the `.fastq` and `*classifiedreads.txt` file if you supply `--kraken2_save_reads` and/or `--kraken2_save_readclassifications` parameters to the pipeline.
+
+When running Bracken, you will only get the 'intermediate' Kraken2 report files in this directory if you supply `--bracken_save_intermediatekraken2` to the run.
+
+### KrakenUniq
+
+[KrakenUniq](https://github.com/fbreitwieser/krakenuniq) (formerly KrakenHLL) is an extension to the fast k-mer-based classification performed by [Kraken](https://github.com/DerrickWood/kraken) with an efficient algorithm for additionally assessing the coverage of unique k-mers found in each species in a dataset.
+
+Output files
+
+- `krakenuniq/`
+  - `/`
+    - `_[.merged].classified.fast{a,q}.gz`: Optional FASTA file containing all reads that had a hit against a reference in the database for a given sample. Paired-end input reads are merged in this output.
+    - `_[.merged].unclassified.fast{a,q}.gz`: Optional FASTA file containing all reads that did not have a hit in the database for a given sample. Paired-end input reads are merged in this output.
+    - `_.krakenuniq.report.txt`: A Kraken2-style report that summarises the fraction abundance, taxonomic ID, number of Kmers, taxonomic path of all the hits, with an additional column for k-mer coverage, that allows for more accurate distinguishing between false-positive/true-positive hits.
+    - `_.krakenuniq.classified.txt`: An optional list of read IDs and the hits each read had against each database for a given sample.
+
+
+The main taxonomic classification file from KrakenUniq is the `*.krakenuniq.report.txt` file. This is an extension of the Kraken2 report with the additional k-mer coverage information that provides more information about the accuracy of hits.
+
+You will only receive the `.fasta.gz` and `*.krakenuniq.classified.txt` file if you supply `--krakenuniq_save_reads` and/or `--krakenuniq_save_readclassification` parameters to the pipeline.
+
+:::info
+The output system of KrakenUniq can result in other `stdout` or `stderr` logging information being saved in the report file, therefore you must check your report files before downstream use!
+:::
+
+### Centrifuge
+
+[Centrifuge](https://github.com/DaehwanKimLab/centrifuge) is a taxonomic sequence classifier that uses a Burrows-Wheeler transform and Ferragina-Manzini index for storing and mapping sequences.
+
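+A hedged sketch of the classification plus Kraken-style report conversion (index prefix and file names are placeholders):
+
+```bash
+# Classify reads, then convert results to a Kraken-style report
+centrifuge -x /path/to/centrifuge_index \
+    -1 sample_R1.fastq.gz -2 sample_R2.fastq.gz \
+    -S sample.centrifuge.results.txt \
+    --report-file sample.centrifuge.report.txt
+centrifuge-kreport -x /path/to/centrifuge_index \
+    sample.centrifuge.results.txt > sample.centrifuge.txt
+```
+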
+Output files + +- `centrifuge/` + - `/` + - `.centrifuge.mapped.fastq.gz`: `FASTQ` files containing all mapped reads + - `.centrifuge.report.txt`: A classification report that summarises the taxonomic ID, the taxonomic rank, length of genome sequence, number of classified and uniquely classified reads + - `.centrifuge.results.txt`: A file that summarises the classification assignment for a read, i.e read ID, sequence ID, score for the classification, score for the next best classification, number of classifications for this read + - `.centrifuge.txt`: A Kraken2-style report that summarises the fraction abundance, taxonomic ID, number of k-mers, taxonomic path of all the hits in the centrifuge run for a given sample + - `.centrifuge.unmapped.fastq.gz`: FASTQ file containing all unmapped reads + +
+ +The main taxonomic classification files from Centrifuge are the `_combined_reports.txt`, `*report.txt`, `*results.txt` and the `*centrifuge.txt`. The latter is used by the taxpasta step. You will receive the `.fastq` files if you supply `--centrifuge_save_reads`. + +### Kaiju + +[Kaiju](https://github.com/bioinformatics-centre/kaiju) is a taxonomic classifier that finds maximum exact matches on the protein-level using the Burrows-Wheeler transform. + +
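+As an illustration of protein-level classification followed by summarisation (taxdump and database file names are placeholders; the pipeline runs these as separate modules):
+
+```bash
+# Classify read pairs at the protein level, then build a per-taxon table
+kaiju -z 8 -t nodes.dmp -f kaiju_db.fmi \
+    -i sample_R1.fastq.gz -j sample_R2.fastq.gz \
+    -o sample.kaiju.tsv
+kaiju2table -t nodes.dmp -n names.dmp -r species \
+    -o sample.kaijutable.txt sample.kaiju.tsv
+```
+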
+Output files
+
+- `kaiju/`
+  - `kaiju__combined_reports.txt`: A combined profile of all samples aligned to a given database (as generated by kaiju2table)
+  - `/`
+    - `_.kaiju.tsv`: Raw output from Kaiju with taxonomic rank, read ID and taxonomic ID
+    - `_.kaijutable.txt`: Summarised Kaiju output with fraction abundance, taxonomic ID, number of reads, and taxonomic names (as generated by `kaiju2table`)
+
+
+The most useful summary file is the `_combined_reports.txt` file, which summarises hits across all reads and samples. Separate per-sample summaries can be seen in `/*.txt`. However, if you wish to look at more precise information on a per-read basis, see the `*tsv` file. The default taxonomic rank is `species`. You can provide a different one by updating the argument `--kaiju_taxon_rank`.
+
+### DIAMOND
+
+[DIAMOND](https://github.com/bbuchfink/diamond) is a sequence aligner for translated DNA searches or protein sequences against a protein reference database such as NR. It is a replacement for the NCBI BLAST software tools. It has many key features and it is used as a taxonomic classifier in nf-core/taxprofiler.
+
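+A minimal sketch of a translated search with taxonomic output, assuming a pre-built DIAMOND database (database and file names are placeholders):
+
+```bash
+# --outfmt 102 emits one taxonomic assignment per query sequence
+diamond blastx --db nr.dmnd \
+    --query sample_R1.fastq.gz \
+    --out sample.diamond.tsv \
+    --outfmt 102 --threads 8
+```
+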
+Output files + +- `diamond/` + - `/` + - `.log`: A log file containing stdout information + - `*.{blast,xml,txt,daa,sam,tsv,paf}`: A file containing alignment information in various formats, or taxonomic information in a text-based format. Exact output depends on user choice. + +
+ +By default you will receive a TSV output. Alternatively, you will receive a `*.sam` file if you provide the parameter `--diamond_save_reads` but in this case no taxonomic classification will be available(!), only the aligned reads in sam format. + +:::info +DIAMOND has many output formats, so depending on your [choice](https://github.com/bbuchfink/diamond/wiki/3.-Command-line-options) with ` --diamond_output_format` you will receive the taxonomic information in a different format. +::: + +### MALT + +[MALT](https://software-ab.cs.uni-tuebingen.de/download/malt) is a fast replacement for BLASTX, BLASTP and BLASTN, and provides both local and semi-global alignment capabilities. + +
+Output files + +- `malt/` + - `/` + - `.blastn.sam`: sparse SAM file containing alignments of each hit + - `.megan`: summary file that can be loaded into the [MEGAN6](https://uni-tuebingen.de/fakultaeten/mathematisch-naturwissenschaftliche-fakultaet/fachbereiche/informatik/lehrstuehle/algorithms-in-bioinformatics/software/megan6/) interactive viewer. Generated by MEGAN6 companion tool `rma2info` + - `.rma6`: binary file containing all alignments and taxonomic information of hits that can be loaded into the [MEGAN6](https://uni-tuebingen.de/fakultaeten/mathematisch-naturwissenschaftliche-fakultaet/fachbereiche/informatik/lehrstuehle/algorithms-in-bioinformatics/software/megan6/) interactive viewer + - `.txt.gz`: text file containing taxonomic IDs and read counts against each taxon. Generated by MEGAN6 companion tool `rma2info` + +
+
+The main output of MALT is the `.rma6` file format, which can only be loaded into MEGAN and its related tools. We provide the `rma2info` text files for improved compatibility with spreadsheet programs and other programmatic data manipulation tools, however this has only limited information compared to the 'binary' RMA6 file format (the `.txt` file only contains taxonomic ID and count, whereas RMA6 has taxonomic lineage information).
+
+You will only receive the `.sam` and `.megan` files if you supply `--malt_save_reads` and/or `--malt_generate_megansummary` parameters to the pipeline.
+
+### MetaPhlAn
+
+[MetaPhlAn](https://github.com/biobakery/metaphlan) is a computational tool for profiling the composition of microbial communities (Bacteria, Archaea and Eukaryotes) from metagenomic shotgun sequencing data (i.e. not 16S) with species-level resolution via marker genes.
+
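+A hedged standalone sketch of marker-gene profiling for a paired-end sample (database location and file names are placeholders):
+
+```bash
+# Profile a sample against the MetaPhlAn marker database
+metaphlan sample_R1.fastq.gz,sample_R2.fastq.gz \
+    --input_type fastq \
+    --bowtie2db /path/to/metaphlan_db \
+    --bowtie2out sample.bowtie2out.txt \
+    --nproc 8 \
+    -o sample_profile.txt
+```
+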
+Output files + +- `metaphlan/` + - `metaphlan__combined_reports.txt`: A combined profile of all samples aligned to a given database (as generated by `metaphlan_merge_tables`) + - `/` + - `.biom`: taxonomic profile in BIOM format + - `.bowtie2out.txt`: BowTie2 alignment information (can be re-used for skipping alignment when re-running MetaPhlAn with different parameters) + - `_profile.txt`: MetaPhlAn taxonomic profile including abundance estimates + +
+
+The output contains a file named `*_combined_reports.txt`, which provides an overview of the classification results for all samples. The main taxonomic profiling file from MetaPhlAn is the `*_profile.txt` file. This provides the abundance estimates from MetaPhlAn, however it does not include raw counts by default. Additionally, it contains intermediate Bowtie2 output `.bowtie2out.txt`, which presents a condensed representation of the mapping results of your sequencing reads to MetaPhlAn's marker gene sequences. The alignments are listed in tab-separated columns, including Read ID and Marker Gene ID, with each alignment represented on a separate line.
+
+### mOTUs
+
+[mOTUs](https://github.com/motu-tool/mOTUs) is a taxonomic profiler that maps reads to a unique marker-specific database and estimates the relative abundance of known and unknown species.
+
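+As a rough sketch only (flag usage should be checked against the mOTUs documentation; file names are placeholders):
+
+```bash
+# Profile a paired-end sample; -p adds NCBI taxonomy IDs to the output
+motus profile -f sample_R1.fastq.gz -r sample_R2.fastq.gz \
+    -t 8 -p -o sample.out
+```
+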
+Output files + +- `motus/` + - `/` + - `.log`: A log file that contains summary statistics + - `.out`: A classification file that summarises taxonomic identifiers, by default at the rank of mOTUs (i.e., species level), and their relative abundances in the profiled sample. + - `motus__combined_reports.txt`: A combined profile of all samples aligned to a given database (as generated by `motus_merge`) + +
+ +Normally `*_combined_reports.txt` is the most useful file for downstream analyses, but the per sample `.out` file can provide additional more specific information. By default, nf-core/taxprofiler is providing a column describing NCBI taxonomic ID as this is used in the taxpasta step. You can disable this column by activating the argument `--motus_remove_ncbi_ids`. +You will receive the relative abundance instead of read counts if you provide the argument `--motus_use_relative_abundance`. + +### KMCP + +[KMCP](https://github.com/shenwei356/kmcp) utilises genome coverage information by splitting the reference genomes into chunks and stores k-mers in a modified and optimised COBS index for fast alignment-free sequence searching. KMCP combines k-mer similarity and genome coverage information to reduce the false positive rate of k-mer-based taxonomic classification and profiling methods. + +
+Output files + +- `kmcp/` + + - `/` + - `.gz`: output of `kmcp_search` containing search sequences against a database in tab-delimited format with 15 columns. + - `_kmcp.profile`: output of `kmcp_profile` containing the taxonomic profile from search results. + +
+ +You will receive the `.gz` file if you supply `--kmcp_save_search`. Please note that there is no taxonomic label assignment in this output file. + +The main taxonomic classification file from KMCP is the `*kmcp.profile` which is also used by the taxpasta step. + +### ganon + +[ganon](https://pirovc.github.io/ganon/) is designed to index large sets of genomic reference sequences and to classify reads against them efficiently. The tool uses Interleaved Bloom Filters as indices based on k-mers/minimizers. It was mainly developed, but not limited, to the metagenomics classification problem: quickly assign sequence fragments to their closest reference among thousands of references. After classification, taxonomic abundance is estimated and reported. + +
+Output files + +- `ganon/` + + - `/` + + - `_report.tre`: output of `ganon report` containing taxonomic classifications with possible formatting and/or filtering depending on options specified. + - ``.tre: output of `ganon classify` containing raw taxonomic classifications and abundance estimations with no additional formatting or filtering. + - ``.rep: 'raw' report of counts against each taxon. + - ``.all: per-read summary of all hits of each reads. + - ``.lca: per-read summary of the best single hit after LCA for each read. + - ``.unc: list of read IDs with no hits. + - ``.log: the stdout console messages printed by `ganon classify`, containing some classification summary information + + - `ganon__combined_reports.txt`: A combined profile of all samples aligned to a given database (as generated by `ganon table`) + +
+ +Generally you will want to refer to the `combined_reports.txt` or `_report.tre` file. For further descriptions of the contents of each file, see the [ganon documentation](https://pirovc.github.io/ganon/outputfiles/). + +You will only receive the `.all`, `.lca`, and `.unc` files if you supply the `--ganon_save_readclassifications` parameter to the pipeline. + +### Krona + +[Krona](https://github.com/marbl/Krona) allows the exploration of (metagenomic) hierarchical data with interactive zooming, multi-layered pie charts. + +Krona charts will be generated by the pipeline for supported tools (Kraken2, Centrifuge, Kaiju, and MALT) + +
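+The pipeline generates these charts through its own modules; purely to illustrate the idea, a Kraken2-style report can be converted and rendered by hand with KrakenTools and KronaTools (both assumed to be installed; file names are placeholders):
+
+```bash
+# Convert a Kraken2 report to Krona text input, then render the chart
+kreport2krona.py -r sample.kraken2.report.txt -o sample.krona.txt
+ktImportText sample.krona.txt -o sample.krona.html
+```
+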
+Output files + +- `krona/` + - `_.html`: per-tool/per-database interactive HTML file containing hierarchical piecharts + +
+
+The resulting HTML files can be loaded into your web browser for exploration. Each file will have a dropdown to allow you to switch between each sample aligned against the given database of the tool.
+
+### TAXPASTA
+
+[TAXPASTA](https://github.com/taxprofiler/taxpasta) standardises and optionally merges two or more taxonomic profiles across samples into one single table. It supports multiple different classifiers, simplifying comparison of taxonomic classification results between tools and databases.
+
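+A hedged sketch of merging per-sample Kraken2 reports into one standardised table (taxdump path and file names are placeholders):
+
+```bash
+# Merge profiles and attach taxon names from a local NCBI taxdump
+taxpasta merge --profiler kraken2 \
+    --output kraken2_merged.tsv \
+    --add-name --taxonomy /path/to/taxdump \
+    sample1.kraken2.report.txt sample2.kraken2.report.txt
+```
+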
+Output files + +- `taxpasta/` + + - `_*.{tsv,csv,arrow,parquet,biom}`: Standardised taxon table containing multiple samples. The standard format is the `tsv`. + - The first column describes the taxonomy ID and the rest of the columns describe the read counts for each sample. + - Note that the file naming scheme will apply regardless of whether `TAXPASTA_MERGE` (multiple sample run) or `TAXPASTA_STANDARDISE` (single sample run) are executed. + - If you have also run Bracken, the initial Kraken report (i.e., _before_ read re-assignment) will also be included in this directory with `-bracken` suffixed to your Bracken database name. For example: `kraken2--bracken.tsv`. However in most cases you want to use the actual Bracken file (i.e., `bracken_.tsv`). + +
+
+By providing the path to a directory containing taxdump files to `--taxpasta_taxonomy_dir`, the taxon name, the taxon rank, the taxon's entire lineage including taxon names and/or the taxon's entire lineage including taxon identifiers can also be added in the output in addition to just the taxon ID. Addition of this extra information can be turned on by using the parameters `--taxpasta_add_name`, `--taxpasta_add_rank`, `--taxpasta_add_lineage` and `--taxpasta_add_idlineage` respectively.
+
+These files will likely be the most useful files for the comparison of differences in classification between different tools or for building consensuses, with the caveat that they have slightly less information than the actual output from each tool (which may have non-standard information e.g. taxonomic rank, percentage of hits, abundance estimations).
+
+The following report files are used for the taxpasta step:
+
+- Bracken: `_.tsv` Taxpasta uses the `new_est_reads` column for the standardised profile.
+- Centrifuge: `.centrifuge.txt` Taxpasta uses the `direct_assigned_reads` column for the standardised profile.
+- Diamond: `` Taxpasta summarises the number of reads per NCBI taxonomy ID for the standardised profile.
+- Kaiju: `_.kaijutable.txt` Taxpasta uses the `reads` column from kaiju2table for the standardised profile.
+- KrakenUniq: `_.report.txt` Taxpasta uses the `reads` column for the standardised profile.
+- Kraken2: `_.report.txt` Taxpasta uses the `direct_assigned_reads` column for the standardised profile.
+- MALT: `.txt.gz` Taxpasta uses the `count` (second) column from the output of MEGAN6's rma2info for the standardised profile.
+- MetaPhlAn: `_profile.txt` Taxpasta uses the `relative_abundance` column multiplied with a fixed number to yield an integer for the standardised profile.
+- mOTUs: `.out` Taxpasta uses the `read_count` column for the standardised profile.
+
+:::warning
+Please be aware that the outputs of each tool's standardised profile _may not_ be directly comparable between tools. Some may report raw read counts, whereas others may report abundance information. Please always refer to the list above for which information is used for each tool.
+:::
+
+Output files + +- `multiqc/` + - `multiqc_report.html`: a standalone HTML file that can be viewed in your web browser. + - `multiqc_data/`: directory containing parsed statistics from the different tools used in the pipeline. + - `multiqc_plots/`: directory containing static images from the report in various formats. + +
+
+[MultiQC](http://multiqc.info) is a visualization tool that generates a single HTML report summarising all samples in your project. Most of the pipeline QC results are visualised in the report and further statistics are available in the report data directory.
+
+Results generated by MultiQC collate pipeline QC from supported tools e.g. FastQC. The pipeline has special steps which also allow the software versions to be reported in the MultiQC output for future traceability. For more information about how to use MultiQC reports, see <http://multiqc.info>.
+
+All tools in taxprofiler supported by MultiQC will have a dedicated section showing summary statistics of each tool based on information stored in log files.
+
+You can expect in the MultiQC reports either sections and/or general stats columns for the following tools:
+
+- fastqc
+- adapterRemoval
+- fastp
+- bbduk
+- prinseqplusplus
+- porechop
+- filtlong
+- bowtie2
+- minimap2
+- samtools (stats)
+- kraken
+- bracken
+- centrifuge
+- kaiju
+- diamond
+- malt
+- motus
+
+:::info
+The 'General Stats' table by default will only show statistics referring to pre-processing steps, and will not display possible values from each classifier/profiler, unless turned on by the user within the 'Configure Columns' menu or via a custom MultiQC config file (`--multiqc_config`)
+:::
+
+### Pipeline information
+
+Output files
+
+- `pipeline_info/`
+  - Reports generated by Nextflow: `execution_report.html`, `execution_timeline.html`, `execution_trace.txt` and `pipeline_dag.dot`/`pipeline_dag.svg`.
+  - Reports generated by the pipeline: `pipeline_report.html`, `pipeline_report.txt` and `software_versions.yml`. The `pipeline_report*` files will only be present if the `--email` / `--email_on_fail` parameters are used when running the pipeline.
+  - Reformatted samplesheet files used as input to the pipeline: `samplesheet.valid.csv`.
+  - Parameters used by the pipeline run: `params.json`.
+
+ +[Nextflow](https://www.nextflow.io/docs/latest/tracing.html) provides excellent functionality for generating various reports relevant to the running and execution of the pipeline. This will allow you to troubleshoot errors with the running of the pipeline, and also provide you with other information such as launch commands, run times and resource usage. + diff --git a/bu_isciii/assets/reports/results/mag.md b/bu_isciii/assets/reports/results/mag.md index 90193de6d..dd7848b73 100644 --- a/bu_isciii/assets/reports/results/mag.md +++ b/bu_isciii/assets/reports/results/mag.md @@ -6,3 +6,12 @@ Here we describe the results from the MAG pipeline for multispecies metagenomic > [!WARNING] > Software's versions used in this analysis can be obtained from the `MultiQC` report. + +## Taxprofiler + +Here we describe the results from the (nf-core/taxprofiler)[https://nf-co.re/taxprofiler/1.1.8] pipeline for multispecies taxonomic classification and profiling of shorgun short- and long-read. + +* multiqc_report.html​ : Final HTML report collecting numerical stats from each module executed in this pipeline. + +> [!WARNING] +> Software's versions used in this analysis can be obtained from the `MultiQC` report. \ No newline at end of file diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json index 346a98727..44b5f5b68 100755 --- a/bu_isciii/templates/services.json +++ b/bu_isciii/templates/services.json @@ -209,8 +209,8 @@ "order": 2, "begin": "base", "end": "", - "url": "https://github.com/nf-core/mag", - "description": "Bioinformatics best-practise analysis pipeline for assembly, binning and annotation of metagenomes.", + "url": "https://github.com/nf-core/mag or https://github.com/nf-core/taxprofiler", + "description": "1- Bioinformatics best-practise analysis for taxonomic classification and profiling; 2- Bioinformatics best-practise analysis pipeline for assembly, binning and annotation of metagenomes.", "clean": { "folders":[], "files":[] From a2fb0aebbcc2bde4a5ced1f04bf42e14464e18f7 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 13:06:08 +0200 Subject: [PATCH 202/321] fixed path to results in taxprofiler results lablog --- bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results index d6231a54b..9867e2f1d 100755 --- a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results +++ b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results @@ -5,4 +5,4 @@ mkdir -p $DELIVERY_FOLDER/taxprofiler cd $DELIVERY_FOLDER/taxprofiler # Links to reports -ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/results/multiqc/multiqc_report.html . +ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/multiqc/multiqc_report.html . 
From fad629309cef22efc38a25a17e9facd0cfa425a5 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 13:06:39 +0200 Subject: [PATCH 203/321] fixed indentation --- .../templates/mag/DOC/taxprofiler.config | 30 +++++++++---------- 1 file changed, 15 insertions(+), 15 deletions(-) diff --git a/bu_isciii/templates/mag/DOC/taxprofiler.config b/bu_isciii/templates/mag/DOC/taxprofiler.config index bfbc4ac15..60569c0ac 100644 --- a/bu_isciii/templates/mag/DOC/taxprofiler.config +++ b/bu_isciii/templates/mag/DOC/taxprofiler.config @@ -3,31 +3,31 @@ */ singularity { - enabled = true - autoMounts = true - singularity.cacheDir = '/data/cnm/ratb/pipelines/singularity-images/' + enabled = true + autoMounts = true + singularity.cacheDir = '/data/cnm/ratb/pipelines/singularity-images/' } process { - executor = 'slurm' - queue = 'middle_idx' - jobName = { "$task.name - $task.hash" } - conda = null + executor = 'slurm' + queue = 'middle_idx' + jobName = { "$task.name - $task.hash" } + conda = null - errorStrategy = { task.exitStatus in ((130..145) + 104) ? 'retry' : 'finish' } + errorStrategy = { task.exitStatus in ((130..145) + 104) ? 'retry' : 'finish' } withName:'KAIJU_KAIJU' { - errorStrategy = { task.exitStatus in [143,137,21,1] ? 'retry' : 'finish' } + errorStrategy = { task.exitStatus in [143,137,21,1] ? 'retry' : 'finish' } maxRetries = 3 - memory = { 72.GB * task.attempt } - time = { 8.h } - } + memory = { 72.GB * task.attempt } + time = { 8.h } + } } params { - max_memory = 376.GB - max_cpus = 32 - max_time = '24.h' + max_memory = 376.GB + max_cpus = 32 + max_time = '24.h' } /* From 2f16d06fb9336485fd64653af09b2ec1739f1aa7 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 14:15:41 +0200 Subject: [PATCH 204/321] added krona rhtml to results folder --- bu_isciii/assets/reports/results/mag.md | 5 +++-- bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results | 2 ++ 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/bu_isciii/assets/reports/results/mag.md b/bu_isciii/assets/reports/results/mag.md index dd7848b73..cec03e6ba 100644 --- a/bu_isciii/assets/reports/results/mag.md +++ b/bu_isciii/assets/reports/results/mag.md @@ -2,7 +2,7 @@ Here we describe the results from the MAG pipeline for multispecies metagenomic analysis. -* krona_results.html​ : Final HTML report with the top 5 species most present in all samples. +* `krona_results.html`​ : Final HTML report with the top 5 species most present in all samples. > [!WARNING] > Software's versions used in this analysis can be obtained from the `MultiQC` report. @@ -11,7 +11,8 @@ Here we describe the results from the MAG pipeline for multispecies metagenomic Here we describe the results from the (nf-core/taxprofiler)[https://nf-co.re/taxprofiler/1.1.8] pipeline for multispecies taxonomic classification and profiling of shorgun short- and long-read. -* multiqc_report.html​ : Final HTML report collecting numerical stats from each module executed in this pipeline. +* `multiqc_report.html​`: Final HTML report collecting numerical stats from each module executed in this pipeline. +* `krona/*.html`: Interactive HTML files generated by Krona, displaying the results of taxonomic classification. > [!WARNING] > Software's versions used in this analysis can be obtained from the `MultiQC` report. 
\ No newline at end of file diff --git a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results index 9867e2f1d..7c846010e 100755 --- a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results +++ b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results @@ -6,3 +6,5 @@ cd $DELIVERY_FOLDER/taxprofiler # Links to reports ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/multiqc/multiqc_report.html . +ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/krona . + From 573758e4a57ac7830cd8e0efb4743ea09386a2c8 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 14:21:29 +0200 Subject: [PATCH 205/321] added user to sftp --- bu_isciii/templates/sftp_user.json | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/bu_isciii/templates/sftp_user.json b/bu_isciii/templates/sftp_user.json index f8ee42f60..2461c05d9 100755 --- a/bu_isciii/templates/sftp_user.json +++ b/bu_isciii/templates/sftp_user.json @@ -52,5 +52,6 @@ "anadonoso": ["Labenterovirus"], "mvmoneo": ["SpainUDP"], "bbaladron": ["SpainUDP"], - "bioinfoadm": ["test"] + "bioinfoadm": ["test"], + "s.varona": ["misc"] } From 708b855dd70bbe91312397b3b90c547760f9d3bd Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 30 Aug 2024 15:17:38 +0200 Subject: [PATCH 206/321] added prefix to krona html results --- bu_isciii/assets/reports/results/mag.md | 2 +- bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results | 6 +++++- 2 files changed, 6 insertions(+), 2 deletions(-) diff --git a/bu_isciii/assets/reports/results/mag.md b/bu_isciii/assets/reports/results/mag.md index cec03e6ba..fa6ea6cb7 100644 --- a/bu_isciii/assets/reports/results/mag.md +++ b/bu_isciii/assets/reports/results/mag.md @@ -12,7 +12,7 @@ Here we describe the results from the MAG pipeline for multispecies metagenomic Here we describe the results from the (nf-core/taxprofiler)[https://nf-co.re/taxprofiler/1.1.8] pipeline for multispecies taxonomic classification and profiling of shorgun short- and long-read. * `multiqc_report.html​`: Final HTML report collecting numerical stats from each module executed in this pipeline. -* `krona/*.html`: Interactive HTML files generated by Krona, displaying the results of taxonomic classification. +* `krona/database_*.html`: Interactive HTML files generated by Krona, displaying the results of taxonomic classification for supported tools (Kraken2, Centrifuge, Kaiju, and MALT) > [!WARNING] > Software's versions used in this analysis can be obtained from the `MultiQC` report. \ No newline at end of file diff --git a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results index 7c846010e..cfb01fa4c 100755 --- a/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results +++ b/bu_isciii/templates/mag/RESULTS/lablog_taxprofiler_results @@ -6,5 +6,9 @@ cd $DELIVERY_FOLDER/taxprofiler # Links to reports ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/multiqc/multiqc_report.html . -ln -s ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/krona . 
+
+mkdir -p krona
+for file in ../../../ANALYSIS/*ANALYSIS01_TAXPROFILER/krona/*.html; do
+    base=$(basename "$file")
+    ln -s "../$file" "krona/database_${base}"
+done

From e61ac18b78ff2a83c52f0edb69b7d03db71d2be4 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 22 Aug 2024 09:00:37 +0200
Subject: [PATCH 207/321] added init config for mag template

---
 bu_isciii/templates/mag/DOC/mag.config | 52 +++++++++++++++++++++-----
 1 file changed, 42 insertions(+), 10 deletions(-)

diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config
index 732980bf1..fdb5093e4 100644
--- a/bu_isciii/templates/mag/DOC/mag.config
+++ b/bu_isciii/templates/mag/DOC/mag.config
@@ -1,19 +1,51 @@
+/*
+    HPC XTUTATIS CONFIGURATION
+*/
+
 singularity {
-    enabled = true
-    autoMounts = true
+    enabled = true
+    autoMounts = true
+    singularity.cacheDir = '/data/bi/pipelines/singularity-images'
 }
 
 process {
-    executor = 'slurm'
-    queue = 'middle_idx'
-    queue = 'middle_idx'
-    errorStrategy = { task.exitStatus in [140,143,137,138,104,134,139] ? 'retry' : 'finish'; task.exitStatus in [1,4,255] ? 'ignore' : 'finish' }
-    maxRetries = 1
-    maxErrors = '-1'
+    executor = 'slurm'
+    queue = 'long_idx'
+    jobName = { "$task.name - $task.hash" }
+    conda = null
+
+    errorStrategy = { task.exitStatus in ((130..145) + 104) ? 'retry' : 'finish' }
+
+    withName:'SPADES|MEGAHIT' {
+        errorStrategy = { task.exitStatus in [143,137,21,1] ? 'retry' : 'finish' }
+        maxRetries = 2
+        cpus = { 16 * task.attempt }
+        memory = { 64.GB * task.attempt }
+        time = { 24.h }
+    }
+    withName:'MAXBIN2' {
+        // often fails when insufficient information, so we allow it to gracefully fail without failing the pipeline
+        errorStrategy = { task.exitStatus in [ 1, 255 ] ? 'ignore' : 'retry' }
+        time = { 8.h * task.attempt }
+    }
+    withName:CONCOCT_CONCOCT {
+        errorStrategy = { task.exitStatus in [140] ? 'retry' : 'finish' }
+        maxRetries = 2
+        cpus = { 12 * task.attempt }
+        memory = { 64.GB * task.attempt }
+        time = { 12.h * task.attempt }
+    }
+    withName:CHECKM_LINEAGEWF {
+        errorStrategy = { task.exitStatus in [1] ? 'retry' : 'finish' }
+        maxRetries = 3
+        cpus = { 8 * task.attempt }
+        memory = { 32.GB * task.attempt }
+        time = { 4.h * task.attempt }
+    }
 }
 
 params {
-    max_memory = 376.GB
+    max_memory = 128.GB
     max_cpus = 32
-    max_time = '48.h'
+    max_time = '84.h'
 }

From 0d9e3803fedbbad4df33f9046e5c077996dfd4c0 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 22 Aug 2024 09:10:36 +0200
Subject: [PATCH 208/321] added mag-complete lablogs

---
 .../ANALYSIS02_MAG/lablog_mag_complete | 37 +++++++++++++++++++
 1 file changed, 37 insertions(+)
 create mode 100644 bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete

diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete
new file mode 100644
index 000000000..1cc51ad6e
--- /dev/null
+++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete
@@ -0,0 +1,37 @@
+# SETUP INPUT SAMPLE SHEET
+ln -s ../00-reads .
+ln -s ../samples_id.txt .
+
+# Setup samplesheet
+echo "sample,group,short_reads_1,short_reads_2,long_reads" > samplesheet.csv
+cat samples_id.txt | while read in; do
+    echo "${in},,00-reads/${in}_R1.fastq.gz,00-reads/${in}_R2.fastq.gz,"
+done >> samplesheet.csv
+
+scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")
+
+
+cat <<EOF > complete_mag.sbatch
+#!/bin/sh
+#SBATCH --ntasks 1
+#SBATCH --cpus-per-task 2
+#SBATCH --mem 8G
+#SBATCH --time 120:00:00
+#SBATCH --partition long_idx
+#SBATCH --output $(date '+%Y%m%d')_metagenomics01.log
+#SBATCH --chdir $scratch_dir
+
+# module load Nextflow/23.10.0 singularity
+export NXF_OPTS="-Xms500M -Xmx8G"
+
+nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\
+    -c ../../DOC/hpc_slurm_mag.config \\
+    -profile singularity \\
+    --input samplesheet.csv \\
+    --kraken2_db '/data/bi/references/kraken/minikraken_8GB_20200312.tgz' \\
+    --skip_spadeshybrid true \\
+    --outdir $(date '+%Y%m%d')_mag_complete \\
+    -resume
+EOF
+
+echo "sbatch complete_mag.sbatch" > _01_run_complete_mag.sh

From 1711849ff3aafaec748f296872c6364635d70d86 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 22 Aug 2024 10:29:16 +0200
Subject: [PATCH 209/321] changed comp queue

---
 bu_isciii/templates/mag/DOC/mag.config | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config
index fdb5093e4..86327ddcc 100644
--- a/bu_isciii/templates/mag/DOC/mag.config
+++ b/bu_isciii/templates/mag/DOC/mag.config
@@ -10,7 +10,7 @@ singularity {
 
 process {
     executor = 'slurm'
-    queue = 'long_idx'
+    queue = 'middle_idx'
     jobName = { "$task.name - $task.hash" }
     conda = null
 
@@ -28,14 +28,14 @@ process {
         errorStrategy = { task.exitStatus in [ 1, 255 ] ? 'ignore' : 'retry' }
         time = { 8.h * task.attempt }
     }
-    withName:CONCOCT_CONCOCT {
+    withName:'CONCOCT_CONCOCT' {
         errorStrategy = { task.exitStatus in [140] ? 'retry' : 'finish' }
         maxRetries = 2
         cpus = { 12 * task.attempt }
         memory = { 64.GB * task.attempt }
         time = { 12.h * task.attempt }
     }
-    withName:CHECKM_LINEAGEWF {
+    withName:'CHECKM_LINEAGEWF' {
         errorStrategy = { task.exitStatus in [1] ?
'retry' : 'finish' } maxRetries = 3 cpus = { 8 * task.attempt } @@ -45,7 +45,7 @@ process { } params { - max_memory = 128.GB + max_memory = 376.GB max_cpus = 32 - max_time = '84.h' + max_time = '48.h' } From 7dc3947a6fb5a105bede07a89a1ca0fb54603927 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Thu, 22 Aug 2024 10:30:32 +0200 Subject: [PATCH 210/321] renaming folders in mag template --- .../lablog_mag_complete => ANALYSIS01_MAG_ALL/lablog} | 8 ++++---- .../99-stats/lablog | 0 .../99-stats/multiqc_config.yaml | 0 .../{ANALYSIS02_MAG => ANALYSIS02_MAG_TAXONOMICS}/lablog | 0 bu_isciii/templates/mag/ANALYSIS/lablog_mag_all | 5 +++++ .../mag/ANALYSIS/{lablog_mag => lablog_mag_taxonomics} | 0 6 files changed, 9 insertions(+), 4 deletions(-) rename bu_isciii/templates/mag/ANALYSIS/{ANALYSIS02_MAG/lablog_mag_complete => ANALYSIS01_MAG_ALL/lablog} (83%) rename bu_isciii/templates/mag/ANALYSIS/{ANALYSIS02_MAG => ANALYSIS02_MAG_TAXONOMICS}/99-stats/lablog (100%) rename bu_isciii/templates/mag/ANALYSIS/{ANALYSIS02_MAG => ANALYSIS02_MAG_TAXONOMICS}/99-stats/multiqc_config.yaml (100%) rename bu_isciii/templates/mag/ANALYSIS/{ANALYSIS02_MAG => ANALYSIS02_MAG_TAXONOMICS}/lablog (100%) create mode 100644 bu_isciii/templates/mag/ANALYSIS/lablog_mag_all rename bu_isciii/templates/mag/ANALYSIS/{lablog_mag => lablog_mag_taxonomics} (100%) diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_MAG_ALL/lablog similarity index 83% rename from bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete rename to bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_MAG_ALL/lablog index 1cc51ad6e..341c46c38 100644 --- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog_mag_complete +++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_MAG_ALL/lablog @@ -11,21 +11,21 @@ done >> samplesheet.csv scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g") -cat < complete_mag.sbatch +cat < mag_complete.sbatch #!/bin/sh #SBATCH --ntasks 1 #SBATCH --cpus-per-task 2 #SBATCH --mem 8G #SBATCH --time 120:00:00 #SBATCH --partition long_idx -#SBATCH --output $(date '+%Y%m%d')_metagenomics01.log +#SBATCH --output $(date '+%Y%m%d')_mag_complete.log #SBATCH --chdir $scratch_dir # module load Nextflow/23.10.0 singularity export NXF_OPTS="-Xms500M -Xmx8G" nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\ - -c ../../DOC/hpc_slurm_mag.config \\ + -c ../../DOC/mag.config \\ -profile singularity \\ --input samplesheet.csv \\ --kraken2_db '/data/bi/references/kraken/minikraken_8GB_20200312.tgz' \\ @@ -34,4 +34,4 @@ nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \ -resume EOF -echo "sbatch complete_mag.sbatch" > _01_run_complete_mag.sh +echo "sbatch mag_complete.sbatch" > _01_run_mag_complete.sh diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG_TAXONOMICS/99-stats/lablog similarity index 100% rename from bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/lablog rename to bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG_TAXONOMICS/99-stats/lablog diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/multiqc_config.yaml b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG_TAXONOMICS/99-stats/multiqc_config.yaml similarity index 100% rename from bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/99-stats/multiqc_config.yaml rename to 
bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG_TAXONOMICS/99-stats/multiqc_config.yaml diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG_TAXONOMICS/lablog similarity index 100% rename from bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG/lablog rename to bu_isciii/templates/mag/ANALYSIS/ANALYSIS02_MAG_TAXONOMICS/lablog diff --git a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all new file mode 100644 index 000000000..68cd3b09f --- /dev/null +++ b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all @@ -0,0 +1,5 @@ +mkdir 00-reads +cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd - +cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd - + +mv ANALYSIS01_MAG_ALL $(date '+%Y%m%d')_ANALYSIS01_MAG_ALL \ No newline at end of file diff --git a/bu_isciii/templates/mag/ANALYSIS/lablog_mag b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics similarity index 100% rename from bu_isciii/templates/mag/ANALYSIS/lablog_mag rename to bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics From 9d542db069710b3ea0266a4c7510659ba8b4df86 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Thu, 22 Aug 2024 15:47:22 +0200 Subject: [PATCH 211/321] update mag config params --- bu_isciii/templates/mag/DOC/mag.config | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config index 86327ddcc..a61f7686e 100644 --- a/bu_isciii/templates/mag/DOC/mag.config +++ b/bu_isciii/templates/mag/DOC/mag.config @@ -19,7 +19,7 @@ process { withName:'SPADES|MEGAHIT' { errorStrategy = { task.exitStatus in [143,137,21,1] ? 'retry' : 'finish' } maxRetries = 2 - cpus = { 16 * task.attempt } + cpus = { 10 * task.attempt } memory = { 64.GB * task.attempt } time = { 24.h } } @@ -31,7 +31,7 @@ process { withName:'CONCOCT_CONCOCT' { errorStrategy = { task.exitStatus in [140] ? 
'retry' : 'finish' } maxRetries = 2 - cpus = { 12 * task.attempt } + cpus = { 8 * task.attempt } memory = { 64.GB * task.attempt } time = { 12.h * task.attempt } } @@ -42,6 +42,9 @@ process { memory = { 32.GB * task.attempt } time = { 4.h * task.attempt } } + withName:'BOWTIE2_PHIX_REMOVAL_BUILD'{ + time = 12.h + } } params { From 72721a95d9ed4bde0dd9fb1b7ea9183a0edf892b Mon Sep 17 00:00:00 2001 From: Dani VM Date: Thu, 22 Aug 2024 15:50:52 +0200 Subject: [PATCH 212/321] fix lablog in mag_tax --- bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics | 2 +- bu_isciii/templates/mag/RESULTS/lablog_mag_results | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics index 5076f4425..72d7d463c 100644 --- a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics +++ b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_taxonomics @@ -1 +1 @@ -mv ANALYSIS02_MAG $(date '+%Y%m%d')_ANALYSIS02_MAG +mv ANALYSIS02_MAG_TAXONOMICS $(date '+%Y%m%d')_ANALYSIS02_MAG_TAXONOMICS diff --git a/bu_isciii/templates/mag/RESULTS/lablog_mag_results b/bu_isciii/templates/mag/RESULTS/lablog_mag_results index 55bc4c0e5..11667ce47 100755 --- a/bu_isciii/templates/mag/RESULTS/lablog_mag_results +++ b/bu_isciii/templates/mag/RESULTS/lablog_mag_results @@ -3,4 +3,4 @@ cd $(date '+%Y%m%d')_entrega01 #Create symbolic links depending on the analysis #Individual files -ln -s ../../ANALYSIS/*_MAG/99-stats/multiqc_report.html ./krona_results.html +ln -s ../../ANALYSIS/*_ANALYSIS02_MAG_TAXONOMICS/99-stats/multiqc_report.html ./krona_results.html From 092ee8fcb7f8b41b634e0d32fe9d391c631bdd70 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 23 Aug 2024 12:11:13 +0200 Subject: [PATCH 213/321] minor config update --- bu_isciii/templates/mag/DOC/mag.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config index a61f7686e..f6e3c8b2c 100644 --- a/bu_isciii/templates/mag/DOC/mag.config +++ b/bu_isciii/templates/mag/DOC/mag.config @@ -17,7 +17,7 @@ process { errorStrategy = { task.exitStatus in ((130..145) + 104) ? 'retry' : 'finish' } withName:'SPADES|MEGAHIT' { - errorStrategy = { task.exitStatus in [143,137,21,1] ? 'retry' : 'finish' } + errorStrategy = { task.exitStatus in [143,137,21,12,1] ? 'retry' : 'finish' } maxRetries = 2 cpus = { 10 * task.attempt } memory = { 64.GB * task.attempt } From d1506ac2fcfde9576e46a2ed285d9278ed8adae9 Mon Sep 17 00:00:00 2001 From: Dani VM Date: Fri, 23 Aug 2024 16:35:47 +0200 Subject: [PATCH 214/321] update changelog #321 --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 42f918ab2..e988773d5 100755 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -65,6 +65,7 @@ Code contributions to the new version: - Added scripts for time series RNAseq and updated differential expression code for differentially expressed transcripts [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316). - Added bbaladron to SFTP users [#316](https://github.com/BU-ISCIII/buisciii-tools/pull/316). - Added new template for comprehensive taxonomy profiling using the nf-core/taxprofiler pipeline [#320](https://github.com/BU-ISCIII/buisciii-tools/pull/320). +- Added full execution support for the MAG template [#321](https://github.com/BU-ISCIII/buisciii-tools/pull/321). 
### Modules

From 73893ddd5520cb5249624406607acd757e0b5f33 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Fri, 23 Aug 2024 16:42:44 +0200
Subject: [PATCH 215/321] dummy changes

---
 bu_isciii/templates/mag/ANALYSIS/lablog_mag_all | 2 +-
 bu_isciii/templates/mag/DOC/mag.config | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all
index 68cd3b09f..a6e0982eb 100644
--- a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all
+++ b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all
@@ -2,4 +2,4 @@ mkdir 00-reads
 cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd -
 cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd -
 
-mv ANALYSIS01_MAG_ALL $(date '+%Y%m%d')_ANALYSIS01_MAG_ALL
\ No newline at end of file
+mv ANALYSIS01_MAG_ALL $(date '+%Y%m%d')_ANALYSIS01_MAG_ALL
diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config
index f6e3c8b2c..3a70811d8 100644
--- a/bu_isciii/templates/mag/DOC/mag.config
+++ b/bu_isciii/templates/mag/DOC/mag.config
@@ -18,7 +18,7 @@ process {
 
     withName:'SPADES|MEGAHIT' {
         errorStrategy = { task.exitStatus in [143,137,21,12,1] ? 'retry' : 'finish' }
-        maxRetries = 2
+        maxRetries = 2
         cpus = { 10 * task.attempt }
         memory = { 64.GB * task.attempt }
         time = { 24.h }

From f46ea4d758cbe0c710ad278e17fd23cfd7968a04 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Tue, 3 Sep 2024 13:51:37 +0200
Subject: [PATCH 216/321] created template for mag_all

---
 .../lablog | 10 ++++-----
 bu_isciii/templates/mag/ANALYSIS/lablog_mag_all | 2 +-
 bu_isciii/templates/mag/DOC/mag.config | 22 ++++++++++++++++++-
 .../mag/RESULTS/lablog_mag_all_results | 6 +++++
 ..._results => lablog_mag_taxonomics_results} | 0
 5 files changed, 33 insertions(+), 7 deletions(-)
 rename bu_isciii/templates/mag/ANALYSIS/{ANALYSIS01_MAG_ALL => ANALYSIS03_MAG_ALL}/lablog (80%)
 create mode 100644 bu_isciii/templates/mag/RESULTS/lablog_mag_all_results
 rename bu_isciii/templates/mag/RESULTS/{lablog_mag_results => lablog_mag_taxonomics_results} (100%)

diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_MAG_ALL/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
similarity index 80%
rename from bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_MAG_ALL/lablog
rename to bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
index 341c46c38..142680656 100644
--- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS01_MAG_ALL/lablog
+++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
@@ -11,14 +11,14 @@ done >> samplesheet.csv
 
 scratch_dir=$(echo $PWD | sed "s/\/data\/bi\/scratch_tmp/\/scratch/g")
 
 
-cat <<EOF > mag_complete.sbatch
+cat <<EOF > mag_all.sbatch
 #!/bin/sh
 #SBATCH --ntasks 1
 #SBATCH --cpus-per-task 2
 #SBATCH --mem 8G
-#SBATCH --time 120:00:00
+#SBATCH --time 72:00:00
 #SBATCH --partition long_idx
-#SBATCH --output $(date '+%Y%m%d')_mag_complete.log
+#SBATCH --output $(date '+%Y%m%d')_mag_all.log
 #SBATCH --chdir $scratch_dir
 
 # module load Nextflow/23.10.0 singularity
@@ -30,8 +30,8 @@ nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\
     --input samplesheet.csv \\
     --kraken2_db '/data/bi/references/kraken/minikraken_8GB_20200312.tgz' \\
     --skip_spadeshybrid true \\
-    --outdir $(date '+%Y%m%d')_mag_complete \\
+    --outdir $(date '+%Y%m%d')_mag_all \\
     -resume
 EOF
 
-echo "sbatch mag_complete.sbatch" > _01_run_mag_complete.sh
+echo "sbatch mag_all.sbatch" > _01_run_mag_all.sh
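A side note on the heredocs used by these lablogs: with an unquoted `EOF` delimiter, `$(date ...)` expands when the lablog runs, while the escaped `\\` survives into the generated sbatch file as a literal line continuation. A minimal sketch of the difference:

```bash
# Unquoted delimiter: $(date ...) expands now, so a fixed date is stamped in.
cat <<EOF > demo_expanded.txt
run_stamp: $(date '+%Y%m%d')
EOF

# Quoted delimiter: nothing expands; the command text survives verbatim.
cat <<'EOF' > demo_literal.txt
run_stamp: $(date '+%Y%m%d')
EOF

diff demo_expanded.txt demo_literal.txt
```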
diff --git a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all
index a6e0982eb..caa07af92 100644
--- a/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all
+++ b/bu_isciii/templates/mag/ANALYSIS/lablog_mag_all
@@ -2,4 +2,4 @@ mkdir 00-reads
 cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R1*.fastq.gz %_R1.fastq.gz" | bash; cd -
 cd 00-reads; cat ../samples_id.txt | xargs -I % echo "ln -s ../../RAW/%_*R2*.fastq.gz %_R2.fastq.gz" | bash; cd -
 
-mv ANALYSIS01_MAG_ALL $(date '+%Y%m%d')_ANALYSIS01_MAG_ALL
+mv ANALYSIS03_MAG_ALL $(date '+%Y%m%d')_ANALYSIS03_MAG_ALL
diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config
index 3a70811d8..05678359e 100644
--- a/bu_isciii/templates/mag/DOC/mag.config
+++ b/bu_isciii/templates/mag/DOC/mag.config
@@ -43,7 +43,7 @@ process {
     }
     withName:'BOWTIE2_PHIX_REMOVAL_BUILD'{
-        time = 12.h
+        time = 18.h
     }
 }
 
@@ -52,3 +52,23 @@ params {
     max_cpus = 32
     max_time = '48.h'
 }
+
+/*
+    CUSTOM OUTPUT FOLDER STRUCTURE -- modules.config
+*/
+params { publish_dir_mode = 'copy' }
+process {
+    withName: 'MULTIQC' {
+        publishDir = [
+            path: { "${params.outdir}/99-stats" },
+            mode: params.publish_dir_mode,
+            saveAs: { filename ->
+                if (filename.equals('versions.yml') || filename.endsWith('.csv')) {
+                    null
+                } else {
+                    filename
+                }
+            }
+        ]
+    }
+}
diff --git a/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results b/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results
new file mode 100644
index 000000000..698a21e7e
--- /dev/null
+++ b/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results
@@ -0,0 +1,6 @@
+mkdir $(date '+%Y%m%d')_entrega01
+cd $(date '+%Y%m%d')_entrega01
+
+#Create symbolic links depending on the analysis
+#Individual files
+ln -s ../../ANALYSIS/*_ANALYSIS03_MAG_ALL/99-stats/multiqc_report.html ./krona_results.html
\ No newline at end of file
diff --git a/bu_isciii/templates/mag/RESULTS/lablog_mag_results b/bu_isciii/templates/mag/RESULTS/lablog_mag_taxonomics_results
similarity index 100%
rename from bu_isciii/templates/mag/RESULTS/lablog_mag_results
rename to bu_isciii/templates/mag/RESULTS/lablog_mag_taxonomics_results

From b67f886e85322c670c4ca2b71c25638adf96d800 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 5 Sep 2024 11:06:23 +0200
Subject: [PATCH 217/321] increase time limit in mag module and add todo

---
 bu_isciii/templates/mag/DOC/mag.config | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config
index 05678359e..837c8dfe6 100644
--- a/bu_isciii/templates/mag/DOC/mag.config
+++ b/bu_isciii/templates/mag/DOC/mag.config
@@ -28,12 +28,13 @@ process {
         errorStrategy = { task.exitStatus in [ 1, 255 ] ? 'ignore' : 'retry' }
         time = { 8.h * task.attempt }
     }
+    // TODO: This binning tool takes ~24h to finish... Consider skipping it.
     withName:'CONCOCT_CONCOCT' {
         errorStrategy = { task.exitStatus in [140] ? 'retry' : 'finish' }
         maxRetries = 2
         cpus = { 8 * task.attempt }
         memory = { 64.GB * task.attempt }
-        time = { 12.h * task.attempt }
+        time = { 24.h * task.attempt }
     }
     withName:'CHECKM_LINEAGEWF' {
         errorStrategy = { task.exitStatus in [1] ? 'retry' : 'finish' }
        maxRetries = 3
         cpus = { 8 * task.attempt }
         memory = { 32.GB * task.attempt }
         time = { 4.h * task.attempt }
     }
 }

From 0f1f4ace148c25f09cb63a59eec7139181e6edb8 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 5 Sep 2024 11:13:27 +0200
Subject: [PATCH 218/321] add mag_all results lablog and documentation

---
 bu_isciii/assets/reports/results/mag.md | 12 ++++++--
 .../mag/RESULTS/lablog_mag_all_results | 29 +++++++++++++++----
 2 files changed, 34 insertions(+), 7 deletions(-)

diff --git a/bu_isciii/assets/reports/results/mag.md b/bu_isciii/assets/reports/results/mag.md
index fa6ea6cb7..ce9685141 100644
--- a/bu_isciii/assets/reports/results/mag.md
+++ b/bu_isciii/assets/reports/results/mag.md
@@ -2,17 +2,25 @@
 
 Here we describe the results from the MAG pipeline for multispecies metagenomic analysis.
 
+### MAG - TAXONOMIC ANALYSIS
+
 * `krona_results.html` : Final HTML report with the top 5 species most present in all samples.
 
 > [!WARNING]
 > Software's versions used in this analysis can be obtained from the `MultiQC` report.
 
+### MAG - COMPLETE ANALYSIS
+
+* `mag_all/krona/${sample_name}.${tool}.report.html`: A Krona interactive visualization report for each sample, based on the Kraken2 (or other) taxonomic classification method.
+* `mag_all/quast/${sample_name}.${tool}.report.html`: A QUAST report on the assembly quality of each sample, assembled with MEGAHIT, SPAdes or another supported assembler.
+* `mag_all/multiqc_report.html`: A combined report generated by MultiQC summarizing various quality control results for all samples.
+
 ## Taxprofiler
 
 Here we describe the results from the [nf-core/taxprofiler](https://nf-co.re/taxprofiler/1.1.8) pipeline for multispecies taxonomic classification and profiling of shotgun short- and long-read data.
 
-* `multiqc_report.html`: Final HTML report collecting numerical stats from each module executed in this pipeline.
-* `krona/database_*.html`: Interactive HTML files generated by Krona, displaying the results of taxonomic classification for supported tools (Kraken2, Centrifuge, Kaiju, and MALT)
+* `taxprofiler/multiqc_report.html`: Final HTML report collecting numerical stats from each module executed in this pipeline.
+* `taxprofiler/krona/database_*.html`: Interactive HTML files generated by Krona, displaying the results of taxonomic classification for supported tools (Kraken2, Centrifuge, Kaiju, and MALT).
 
 > [!WARNING]
 > Software's versions used in this analysis can be obtained from the `MultiQC` report.
\ No newline at end of file
diff --git a/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results b/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results
index 698a21e7e..f467632eb 100644
--- a/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results
+++ b/bu_isciii/templates/mag/RESULTS/lablog_mag_all_results
@@ -1,6 +1,25 @@
-mkdir $(date '+%Y%m%d')_entrega01
-cd $(date '+%Y%m%d')_entrega01
+DELIVERY_FOLDER="$(date '+%Y%m%d')_entrega01"
+mkdir -p $DELIVERY_FOLDER/mag_all
 
-#Create symbolic links depending on the analysis
-#Individual files
-ln -s ../../ANALYSIS/*_ANALYSIS03_MAG_ALL/99-stats/multiqc_report.html ./krona_results.html
+# MAG all service
+cd $DELIVERY_FOLDER/mag_all
+ANALYSIS_FOLDER=../../../ANALYSIS/*_ANALYSIS03_MAG_ALL/*_mag_all
+
+# multiqc report
+ln -s ${ANALYSIS_FOLDER}/99-stats/multiqc_report.html .
+
+# quast reports
+mkdir -p quast
+for quast_report in ${ANALYSIS_FOLDER}/Assembly/*/QC/*/QUAST/report.html; do
+    assembly_tool=$(echo "$quast_report" | awk -F'/' '{print $8}')
+    sample_name=$(echo "$quast_report" | awk -F'/' '{print $10}')
+    ln -s "../$quast_report" "quast/${sample_name}.${assembly_tool}.report.html"
+done
+
+# krona reports
+mkdir -p krona
+for krona_report in ${ANALYSIS_FOLDER}/Taxonomy/*/*/taxonomy.krona.html; do
+    taxonomy_tool=$(echo "$krona_report" | awk -F'/' '{print $8}')
+    sample_name=$(echo "$krona_report" | awk -F'/' '{print $9}')
+    ln -s "../$krona_report" "krona/${sample_name}.${taxonomy_tool}.report.html"
+done
\ No newline at end of file

From 34a852dd732ad01b14f1d925ae3f70088a076b56 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 5 Sep 2024 11:13:51 +0200
Subject: [PATCH 219/321] allow step for refinement

---
 bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog | 1 +
 1 file changed, 1 insertion(+)

diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
index 142680656..55e064df7 100644
--- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
+++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
@@ -30,6 +30,7 @@ nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\
     --input samplesheet.csv \\
     --kraken2_db '/data/bi/references/kraken/minikraken_8GB_20200312.tgz' \\
     --skip_spadeshybrid true \\
+    --refine_bins_dastool true \\
     --outdir $(date '+%Y%m%d')_mag_all \\
     -resume
 EOF

From 730ed93aa44863972c3ae316bb0aaec8f1bb2c72 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 5 Sep 2024 12:07:30 +0200
Subject: [PATCH 220/321] skip concoct due to excess in time limit

---
 .../mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog | 1 +
 bu_isciii/templates/mag/DOC/mag.config | 16 ++++++++--------
 2 files changed, 9 insertions(+), 8 deletions(-)

diff --git a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
index 55e064df7..46875ca53 100644
--- a/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
+++ b/bu_isciii/templates/mag/ANALYSIS/ANALYSIS03_MAG_ALL/lablog
@@ -30,6 +30,7 @@ nextflow run /data/bi/pipelines/nf-core-mag/nf-core-mag-2.5.3/workflow/main.nf \\
     --input samplesheet.csv \\
     --kraken2_db '/data/bi/references/kraken/minikraken_8GB_20200312.tgz' \\
     --skip_spadeshybrid true \\
+    --skip_concoct true \\
     --refine_bins_dastool true \\
     --outdir $(date '+%Y%m%d')_mag_all \\
     -resume
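The `awk -F'/'` calls in the results lablog above hard-code the depth at which the tool and sample names sit in the results tree, so they silently break if `ANALYSIS_FOLDER` gains or loses a path component. A depth-independent sketch, assuming the same `.../Taxonomy/<tool>/<sample>/taxonomy.krona.html` layout:

```bash
for krona_report in ${ANALYSIS_FOLDER}/Taxonomy/*/*/taxonomy.krona.html; do
    # Walk upwards from the file instead of counting fields from the root:
    sample_name=$(basename "$(dirname "$krona_report")")
    taxonomy_tool=$(basename "$(dirname "$(dirname "$krona_report")")")
    echo "${sample_name}.${taxonomy_tool}.report.html"
done
```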
diff --git a/bu_isciii/templates/mag/DOC/mag.config b/bu_isciii/templates/mag/DOC/mag.config
index 837c8dfe6..5f8420a97 100644
--- a/bu_isciii/templates/mag/DOC/mag.config
+++ b/bu_isciii/templates/mag/DOC/mag.config
@@ -28,14 +28,14 @@ process {
         errorStrategy = { task.exitStatus in [ 1, 255 ] ? 'ignore' : 'retry' }
         time = { 8.h * task.attempt }
     }
-    // TODO: This binning tool takes ~24h to finish... Consider skipping it.
-    withName:'CONCOCT_CONCOCT' {
-        errorStrategy = { task.exitStatus in [140] ? 'retry' : 'finish' }
-        maxRetries = 2
-        cpus = { 8 * task.attempt }
-        memory = { 64.GB * task.attempt }
-        time = { 24.h * task.attempt }
-    }
+    // TODO: This binning tool takes ~24h to finish... skip was added in the lablog, however it can be enabled.
+    // withName:'CONCOCT_CONCOCT' {
+    //     errorStrategy = { task.exitStatus in [140] ? 'retry' : 'finish' }
+    //     maxRetries = 2
+    //     cpus = { 8 * task.attempt }
+    //     memory = { 64.GB * task.attempt }
+    //     time = { 24.h * task.attempt }
+    // }
     withName:'CHECKM_LINEAGEWF' {
         errorStrategy = { task.exitStatus in [1] ? 'retry' : 'finish' }

From 3b0a8e8fea74acc04e32f5efbe95dd20dba2c5c0 Mon Sep 17 00:00:00 2001
From: Dani VM
Date: Thu, 5 Sep 2024 12:17:26 +0200
Subject: [PATCH 221/321] update readme in #321

---
 bu_isciii/templates/services.json | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/bu_isciii/templates/services.json b/bu_isciii/templates/services.json
index 44b5f5b68..3aea8fce3 100755
--- a/bu_isciii/templates/services.json
+++ b/bu_isciii/templates/services.json
@@ -210,7 +210,7 @@
         "begin": "base",
         "end": "",
         "url": "https://github.com/nf-core/mag or https://github.com/nf-core/taxprofiler",
-        "description": "1- Bioinformatics best-practise analysis for taxonomic classification and profiling; 2- Bioinformatics best-practise analysis pipeline for assembly, binning and annotation of metagenomes.",
+        "description": "1- Bioinformatics best-practise analysis for taxonomic classification and/or genome binning; 2- Bioinformatics best-practise analysis pipeline for assembly, binning and annotation of metagenomes.",
         "clean": {
             "folders":[],
             "files":[]
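The next patch collects `versions.yml` files for the delivery PDF via a shell `find`. The equivalent can be previewed by hand before running the tool; the service name below is a hypothetical placeholder:

```bash
# SERVICE_NAME is illustrative; mirrors the find call used by load_versions().
SERVICE_NAME="SRVCNM1234_20240906_MAGTEST_user_S"
find /data/bi/services_and_colaborations/*/*/"$SERVICE_NAME" -name '*versions.yml' -print0 \
    | xargs -0 md5sum \
    | sort    # identical checksums reveal the duplicate contents that are later skipped
```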
From 7452159f12fd3194160dca5c7e90cff8a4ae3290 Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Fri, 6 Sep 2024 11:53:54 +0200
Subject: [PATCH 222/321] Added several changes in bioinfo_doc.py to allow the
 inclusion of versions.yml in the pdf associated with the service delivery

---
 bu_isciii/bioinfo_doc.py | 32 ++++++++++++++++++++++++++++++--
 1 file changed, 30 insertions(+), 2 deletions(-)

diff --git a/bu_isciii/bioinfo_doc.py b/bu_isciii/bioinfo_doc.py
index 37512a40e..94a6c2c33 100755
--- a/bu_isciii/bioinfo_doc.py
+++ b/bu_isciii/bioinfo_doc.py
@@ -11,6 +11,7 @@
 import markdown
 import pdfkit
 import PyPDF2
+import yaml
 import subprocess
 import json
 import shutil
@@ -77,7 +78,7 @@ def __init__(
             conf_api["server"], conf_api["api_url"], api_user, api_password
         )
         self.resolution_info = self.rest_api.get_request(
-            request_info="service-data", safe=True, resolution=self.resolution_id
+            request_info="service-data", safe=False, resolution=self.resolution_id
         )
         if self.resolution_info == 404:
             print("Received Error 404 from Iskylims API. Aborting")
@@ -92,7 +93,7 @@ def __init__(
         else:
             self.post_delivery_info()
             self.resolution_info = self.rest_api.get_request(
-                request_info="service-data", safe=True, resolution=self.resolution_id
+                request_info="service-data", safe=False, resolution=self.resolution_id
             )
         self.services_requested = self.resolution_info["resolutions"][0][
             "available_services"
@@ -184,6 +185,7 @@ def __init__(
             self.path, self.conf["services_path"], year, self.service_name
         )
         self.samples = self.resolution_info.get("samples", None)
+        self.versions = self.load_versions()
         self.handled_services = None
         try:
             self.config_pdfkit = pdfkit.configuration()
@@ -206,6 +208,30 @@ def __init__(
         else:
             self.email_psswd = email_psswd
 
+        if self.type == "delivery":
+            service_list = {}
+            for service_id_requested in self.service_ids_requested_list:
+                service_list[service_id_requested] = bu_isciii.service_json.ServiceJson().get_find(service_id_requested, "label")
+            self.all_services = service_list
+
+    def load_versions(self):
+        """Load and parse the versions.yml files found for this service."""
+        result = subprocess.run(f"find /data/bi/services_and_colaborations/*/*/{self.service_name} -name '*versions.yml'", stdout=subprocess.PIPE, text=True, shell=True)
+        versions_files = result.stdout.strip().split("\n")
+        if versions_files == [""]:
+            stderr.print(f"[red] No versions.yml files found for the service {self.service_name}!")
+            return "No software versions data available for this service"
+        else:
+            versions_data = {}
+            loaded_contents = []
+            for versions_file in versions_files:
+                with open(versions_file, 'r') as f:
+                    content = yaml.safe_load(f)
+                if content not in loaded_contents:
+                    versions_data[versions_file] = content
+                    loaded_contents.append(content)
+            return versions_data
+
     def create_structure(self):
         if os.path.exists(self.service_folder):
             log.info("Already created the service folder for %s", self.service_folder)
@@ -332,6 +358,8 @@ def create_markdown(self, file_path):
         # service related information
         markdown_data["service"] = self.resolution_info
         markdown_data["user_data"] = self.resolution_info["service_user_id"]
+        markdown_data["software_versions"] = self.versions
+        markdown_data["services_list"] = self.all_services
 
         samples_in_service = {}
         if self.samples is not None:

From 1bea0ec53d75d03122a05d0272608f3e28755cca Mon Sep 17 00:00:00 2001
From: victor5lm
Date: Fri, 6 Sep 2024 11:55:17 +0200
Subject: [PATCH 223/321] Added a software versions section in the jinja
 delivery template

---
 .../templates/jinja_template_delivery.j2 | 42 +++++++++++++++++--
 1 file changed, 39 insertions(+), 3 deletions(-)

diff --git a/bu_isciii/templates/jinja_template_delivery.j2 b/bu_isciii/templates/jinja_template_delivery.j2
index b55828d3e..058b07901 100644
--- a/bu_isciii/templates/jinja_template_delivery.j2
+++ b/bu_isciii/templates/jinja_template_delivery.j2
@@ -74,9 +74,8 @@ Here we describe information about the resolution delivery.
 {% endif %}
 
 {% if samples %}
-## Samples sequenced at iSCIII:
-
-Here we describe information about the project associated to the service:
+## Samples sequenced at ISCIII:
+Here we describe information about the project associated with the service:
 {% if service_sequencing_center -%}
 * Sequencing center: {{ service_sequencing_center }}{% endif %}
 {% for run , projects in samples.items() %}
 * Run name: {{ run }}
@@ -88,6 +87,43 @@
 {% endfor %}
 {% endif %}
 
+
+
+ +## Software versions: + +{% if services_list is mapping and software_versions is mapping %} +{%- set service_list = services_list.items() | list %} +{%- set file_version_list = software_versions.items() | list %} + +{%- for index in range(service_list | length) %} + {%- if index < file_version_list | length %} + {%- set service_id, description = service_list[index] %} +* {{ description }} ({{ service_id }}): + {%- set file_path, processes = file_version_list[index] %} + {%- if processes | length > 0 %} + {%- for process, tools in processes.items() %} + - {{ process }}: + {%- for tool, version in tools.items() %} + - {{ tool }}: {{ version }} + {%- endfor %} + {%- endfor %} + {%- else %} + - No software versions data available for this file path. + {%- endif %} + {%- else %} + {%- set service_id, description = service_list[index] %} +* {{ description }} ({{ service_id }}): + - No software versions data available for this service. + {%- endif %} +{%- endfor %} +{% else %} +No software versions data available for this service. +{% endif %} +
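Template additions like the software-versions block above are easiest to sanity-check outside the tool. A minimal smoke test of the new context variables, assuming the `jinja2` Python package is installed and using made-up service data:

```bash
python3 - <<'PY'
from jinja2 import Template

# Stub snippet exercising only the services_list loop from the template above;
# the service id and label are hypothetical examples.
snippet = Template("""
{% for service_id, description in services_list.items() -%}
* {{ description }} ({{ service_id }})
{% endfor -%}
""")
print(snippet.render(services_list={"mag_met": "Metagenomics service"}))
PY
```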