diff --git a/CHANGELOG.md b/CHANGELOG.md
index c3d90bc..3173f7c 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,15 +2,39 @@
 
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/)
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+Naming based on: [Mythical creatures](https://en.wikipedia.org/wiki/List_of_legendary_creatures_by_type).
 
-## v1.0dev - [date]
+## v1.0.0 - Aquatic Bahamut [21/08/2024]
 
 Initial release of sanger-tol/ear, created with the [nf-core](https://nf-co.re/) template.
+The current pipeline represents the MVP (minimum viable product) for ear.
 
-### `Added`
+### Added
+- GFASTATS to generate statistics on the input primary genome.
+- MERQURY_FK to generate kmer graphs and analyses of the primary, haplotype and merged assembly.
+- BLOBTOOLKIT to generate busco files and blobtoolkit dataset/plots.
+- CURATIONPRETEXT to generate pretext plots and pngs.
 
-### `Fixed`
+### Parameters
 
-### `Dependencies`
+| Old parameter   | New parameter |
+| --------------- | ------------- |
+|                 | --mapped      |
 
-### `Deprecated`
+### Software dependencies
+
+| Dependency  | Old version   | New version   |
+| ----------- | ------------- | ------------- |
+| sanger-tol/blobtoolkit* |               | draft_assemblies        |
+| sanger-tol/curationpretext* |   |  1.0.0 (UNSC Cradle) |
+| GFASTATS |  | 1.3.6--hdcf5f25_3   |
+| MERQURY_FK  | | 1.2   |
+| MINIMAP2_ALIGN |  | 2.28  |
+| SAMTOOLS_MERGE |  | 1.20--h50ea8bc_0 |
+| SAMTOOLS_SORT  |  | 1.20--h50ea8bc_0 |
+
+
+- Note: for nested pipelines (marked with \*), please check their own CHANGELOG file for a full list of software dependencies.
+
+### Dependencies
+The pipeline depends on a number of databases which are noted in [README](README.md) and [USAGE](docs/usage.md).
diff --git a/README.md b/README.md
index 506512d..652eba6 100644
--- a/README.md
+++ b/README.md
@@ -10,51 +10,74 @@
 
 ## Introduction
 
-**sanger-tol/ear** is a bioinformatics pipeline that ...
+**sanger-tol/ear** is a bioinformatics pipeline that generates the data files required for the generation of ERGA Assembly Reports. sanger-tol/ear nests two other sanger-tol pipelines (blobtoolkit and curationpretext).
 
-<!-- TODO nf-core:
-   Complete this sentence with a 2-3 sentence summary of what types of data the pipeline ingests, a brief overview of the
-   major pipeline sections and the types of output it produces. You're giving an overview to someone new
-   to nf-core here, in 15-20 seconds. For an example, see https://github.com/nf-core/rnaseq/blob/master/README.md#introduction
--->
-
-<!-- TODO nf-core: Include a figure that guides the user through the major workflow steps. Many nf-core
-     workflows use the "tube map" design for that. See https://nf-co.re/docs/contributing/design_guidelines#examples for examples.   -->
-<!-- TODO nf-core: Fill in short bullet-pointed list of the default steps in the pipeline -->
-
-1. Read QC ([`FastQC`](https://www.bioinformatics.babraham.ac.uk/projects/fastqc/))
-2. Present QC for raw reads ([`MultiQC`](http://multiqc.info/))
+1. Read the input yaml file (YAML_INPUT)
+2. Run GFASTATS (GFASTATS)
+3. Run MERQURYFK_MERQURYFK (MERQURYFK)
+4. Run MAIN_MAPPING, longread single-end/paired-end mapping.
+5. Run GENERATE_SAMPLESHEET, generate a csv file required for SANGER_TOL_BTK.
+6. Run SANGER_TOL_BTK, also known as SANGER-TOL/BLOBTOOLKIT a subpipeline for SANGER-TOL/EAR.
+7. Run SANGER_TOL_CPRETEXT, also known as SANGER-TOL/CURATIONPRETEXT a subpipeline for SANGER-TOL/EAR.
 
 ## Usage
 
 > [!NOTE]
 > If you are new to Nextflow and nf-core, please refer to [this page](https://nf-co.re/docs/usage/installation) on how to set-up Nextflow. Make sure to [test your setup](https://nf-co.re/docs/usage/introduction#how-to-run-a-pipeline) with `-profile test` before running the workflow on actual data.
 
-<!-- TODO nf-core: Describe the minimum required steps to execute the pipeline, e.g. how to prepare samplesheets.
-     Explain what rows and columns represent. For instance (please edit as appropriate):
-
-First, prepare a samplesheet with your input data that looks as follows:
-
-`samplesheet.csv`:
-
-```csv
-sample,fastq_1,fastq_2
-CONTROL_REP1,AEG588A1_S1_L002_R1_001.fastq.gz,AEG588A1_S1_L002_R2_001.fastq.gz
+The sanger-tol/ear pipeline requires a number of databases in place in order to run the blobtoolkit pipeline.
+These include:
+   - A blast nt database
+   - A Diamond blast uniprot database
+   - A Diamond blast nr database
+   - An NCBI taxdump
+   - An NCBI rankedlineage.dmp
+
+Next, a yaml file containing the following should then be completed:
+
+```yaml
+# General Values for all subpipelines and modules
+assembly_id: <NAME OF ASSEMBLY>
+reference_hap1: <LOCATION OF PRIMARY ASSEMBLY FILE .FA>
+reference_hap2: <LOCATION OF HAPLOTYPE ASSEMBLY FILE .FA>
+reference_haplotigs: <LOCATION OF THE HAPLOTIGS FILE, REMOVED DURING CURATION .FA>
+
+# If a mapped bam already exists use the below + --mapped TRUE on the nextflow command else ignore it and the pipeline will create it.
+mapped_bam: <MAPPED BAM .BAM>
+
+merquryfk:
+  fastk_hist: <THE PATH TO THE .HIST FILE>
+  fastk_ktab: <PATH TO THE DIRECTORY CONTAINING THE KTAB FILES, ENSURE THE HIDDEN FILES ARE HERE TOO>
+
+# Used by both subpipelines
+longread:
+  type: <hifi|clr|ont|illumina>
+  dir: <DIRECTORY OF LONGREAD FILES .FASTA.GZ>
+curationpretext:
+  aligner: <minimap2|BWAMEM>
+  telomere_motif: <TELOMERE MOTIF OF SAMPLE>
+  hic_dir: <DIRECTORY OF HIC READ FILES .CRAM AND .CRAI>
+btk:
+  taxid: 1464561
+  lineages: <CSV LIST OF DATABASES TO USE: "insecta_odb10,diptera_odb10">
+  gca_accession: GCA_0001 <DEFAULT, DO NOT CHANGE UNLESS YOU HAVE A GCA_ACCESSION FOR YOUR SPECIES>
+  nt_database: <DIRECTORY CONTAINING BLAST DB>
+  nt_database_prefix: <BLASTDB PREFIX>
+  diamond_uniprot_database_path: <PATH TO reference_proteomes.dmnd FROM UNIPROT>
+  diamond_nr_database_path: <PATH TO nr.dmnd>
+  ncbi_taxonomy_path: <DIRECTORY CONTAINING THE TAXDUMP>
+  ncbi_rankedlineage_path: <FOLDER CONTAINING THE rankedlineage.dmp FILE>
+  config: <PATH TO ear/conf/sanger-tol-btk.config TO OVERWRITE PROCESS LIMITS>
 ```
 
-Each row represents a fastq file (single-end) or a pair of fastq files (paired end).
-
--->
 
 Now, you can run the pipeline using:
 
-<!-- TODO nf-core: update the following command to include all required parameters for a minimal example -->
-
 ```bash
-nextflow run sanger-tol/ear \
-   -profile <docker/singularity/.../institute> \
-   --input samplesheet.csv \
-   --outdir <OUTDIR>
+nextflow run sanger-tol/ear -profile <singularity,docker> \
+   --input assets/idCulLati1.yaml \
+   --outdir test-truth \
+   --mapped TRUE # OPTIONAL
 ```
 
 > [!WARNING]
@@ -65,10 +88,6 @@ nextflow run sanger-tol/ear \
 
 sanger-tol/ear was originally written by DLBPointon.
 
-We thank the following people for their extensive assistance in the development of this pipeline:
-
-<!-- TODO nf-core: If applicable, make list of people who have also contributed -->
-
 ## Contributions and Support
 
 If you would like to contribute to this pipeline, please see the [contributing guidelines](.github/CONTRIBUTING.md).
diff --git a/assets/idCulLati1.yaml b/assets/idCulLati1.yaml
new file mode 100644
index 0000000..ea48cc2
--- /dev/null
+++ b/assets/idCulLati1.yaml
@@ -0,0 +1,33 @@
+# General Values for all subpipelines and modules
+assembly_id: idCulLati1_ear
+reference_hap1: /nfs/treeoflife-01/teams/tola/users/dp24/ear/idCulLati1/primary.fa
+reference_hap2: /nfs/treeoflife-01/teams/tola/users/dp24/ear/idCulLati1/hap2.fa
+reference_haplotigs: /
+
+# If a mapped bam already exists use the below + --mapped TRUE on the nextflow command else ignore.
+mapped_bam: /nfs/treeoflife-01/teams/tola/users/dp24/ear/idCulLati1/mapped_bam.bam
+
+merquryfk:
+  fastk_hist: /lustre/scratch122/tol/data/a/5/e/1/6/d/Culex_laticinctus/genomic_data/idCulLati1/pacbio/kmer/k31/idCulLati1.k31.hist
+  fastk_ktab: /lustre/scratch122/tol/data/a/5/e/1/6/d/Culex_laticinctus/genomic_data/idCulLati1/pacbio/kmer/k31/
+
+# Used by both subpipelines
+longread:
+  type: hifi
+  dir: /lustre/scratch122/tol/data/a/5/e/1/6/d/Culex_laticinctus/genomic_data/idCulLati1/pacbio/fasta/
+curationpretext:
+  aligner: minimap2
+  telomere_motif: TTAGG
+  hic_dir: /lustre/scratch122/tol/data/a/5/e/1/6/d/Culex_laticinctus/genomic_data/idCulLati2/hic-arima2/
+btk:
+  taxid: 1464561
+  lineages: "insecta_odb10"
+  gca_accession: GCA_0001
+  nt_database: /data/blastdb/Supported/NT/current
+  nt_database_prefix: nt
+  diamond_uniprot_database_path: /lustre/scratch123/tol/resources/uniprot_reference_proteomes/latest/reference_proteomes.dmnd
+  diamond_nr_database_path: /lustre/scratch123/tol/resources/nr/latest/nr.dmnd
+  ncbi_taxonomy_path: /lustre/scratch123/tol/resources/taxonomy/latest/new_taxdump/
+  ncbi_rankedlineage_path: /lustre/scratch123/tol/resources/taxonomy/latest/new_taxdump/rankedlineage.dmp
+  btk_yaml: /nfs/users/nfs_d/dp24/sanger-tol-ear/assets/btk_draft.yaml
+  config: /nfs/treeoflife-01/teams/tola/users/dp24/ear/conf/sanger-tol-btk.config
diff --git a/assets/real_pdf.yaml b/assets/real_pdf.yaml
new file mode 100644
index 0000000..8f8d4a0
--- /dev/null
+++ b/assets/real_pdf.yaml
@@ -0,0 +1,45 @@
+# SAMPLE INFORMATION
+ToLID: idCulLati1
+Species: Culex laticinctus
+Sex: XX
+Submitter: Michael Paulini
+Affiliation: WSI
+Tags: ERGA-BGE
+
+# SEQUENCING DATA
+DATA:
+  - PacBio HiFi: 51x
+  - Arima v2: 152x
+
+# GENOME PROFILING DATA
+PROFILING:
+  GenomeScope:
+    version: 2.0
+    results_folder: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/genomic_data/idCulLati1/pacbio/kmer/k31/
+
+# ASSEMBLY DATA
+ASSEMBLIES:
+  Pre-curation:
+    pipeline: [hifiasm_v0.19.8-r603|--primary, purge_dups_v1.2.5|-e,  yahs_v1.2a.2|]
+    pri:
+      gfastats--nstar-report_txt: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/working/idCulLati1.hifiasm.20240430/scaffolding/yahs/out.break.yahs/out_scaffolds_final.fa.gz.gfastats
+      busco_short_summary_txt: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/working/idCulLati1.hifiasm.20240430/scaffolding/yahs/out.break.yahs/out_scaffolds_final.insecta_odb10.busco/short_summary.specific.insecta_odb10.out_scaffolds_final.insecta_odb10.busco.txt
+      merqury_folder: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/working/idCulLati1.hifiasm.20240430/scaffolding/yahs/out.break.yahs/out_scaffolds_final.ccs.merquryk/
+
+  Curated:
+    pipeline: [hifiasm_v0.19.8-r603|--primary, purge_dups_v1.2.5|-e,  yahs_v1.2a.2|, TreeVal_v1.1]
+    pri:
+      gfastats--nstar-report_txt: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1.primary.curated.fa.gfastats
+      busco_short_summary_txt: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1.primary.curated.insecta_odb10.busco/short_summary.specific.insecta_odb10.idCulLati1.1.primary.curated.insecta_odb10.busco.txt
+      merqury_folder: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1.primary.curated.ccs.merquryk/
+      hic_FullMap_png: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1_normal_snapshots/idCulLati1.1_normal_FullMap.png
+      hic_FullMap_link: https://tolqc.cog.sanger.ac.uk/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1_normal.pretext
+      blobplot_cont_png: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1_primary_curated_btk_busco.blob.circle.png
+
+# CURATION NOTES
+NOTES:
+  Obs_Haploid_num: 3
+  Obs_Sex: XX
+  Interventions_per_Gb: 430
+  Contamination_notes: "Total length of scaffolds removed: 989,717 (0.1 %)\nScaffolds removed: 1 (0.2 %)\nLargest scaffold removed: (989,717)\nFCS-GX contaminant species (number of scaffolds; total length of scaffolds):\nWolbachia endosymbiont (group B) of Melanostoma mellinum, a-proteobacteria (1; 989,717)"
+  Other_notes: "Chromosomes named by size"
diff --git a/assets/template_pdf.yaml b/assets/template_pdf.yaml
new file mode 100644
index 0000000..3779c19
--- /dev/null
+++ b/assets/template_pdf.yaml
@@ -0,0 +1,45 @@
+# SAMPLE INFORMATION
+ToLID: <SAMPLE_ID>
+Species: <LATIN_NAME>
+Sex: <EXPECTED_SEX>
+Submitter: <CURATOR>
+Affiliation: WSI
+Tags: ERGA-BGE
+
+# SEQUENCING DATA
+DATA:
+  - PacBio HiFi: <PACBIO_COVERAGE>
+  - Arima v2: <ARIMA_COVERAGE>
+
+# GENOME PROFILING DATA
+PROFILING:
+  GenomeScope:
+    version: 2.0
+    results_folder: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/genomic_data/idCulLati1/pacbio/kmer/k31/
+
+# ASSEMBLY DATA
+ASSEMBLIES:
+  Pre-curation:
+    pipeline: [hifiasm_v0.19.8-r603|--primary, purge_dups_v1.2.5|-e,  yahs_v1.2a.2|]
+    pri:
+      gfastats--nstar-report_txt: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/working/idCulLati1.hifiasm.20240430/scaffolding/yahs/out.break.yahs/out_scaffolds_final.fa.gz.gfastats
+      busco_short_summary_txt: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/working/idCulLati1.hifiasm.20240430/scaffolding/yahs/out.break.yahs/out_scaffolds_final.insecta_odb10.busco/short_summary.specific.insecta_odb10.out_scaffolds_final.insecta_odb10.busco.txt
+      merqury_folder: /lustre/scratch123/tol/tolqc/data/erga-bge/insects/Culex_laticinctus/working/idCulLati1.hifiasm.20240430/scaffolding/yahs/out.break.yahs/out_scaffolds_final.ccs.merquryk/
+
+  Curated:
+    pipeline: [hifiasm_v0.19.8-r603|--primary, purge_dups_v1.2.5|-e,  yahs_v1.2a.2|, TreeVal_v1.1]
+    pri:
+      gfastats--nstar-report_txt: idCulLati1.1.primary.curated.fa.gfastats
+      busco_short_summary_txt: short_summary.specific.insecta_odb10.idCulLati1.1.primary.curated.insecta_odb10.busco.txt
+      merqury_folder: <POST_CURATION_MERQURY_FOLDER>
+      hic_FullMap_png: <CURATION_PRETEXT_PRETEXT_MAP_PNG>
+      hic_FullMap_link: https://tolqc.cog.sanger.ac.uk/erga-bge/insects/Culex_laticinctus/assembly/curated/idCulLati1.1/ear/idCulLati1.1_normal.pretext
+      blobplot_cont_png: idCulLati1.1_primary_curated_btk_busco.blob.circle.png
+
+# CURATION NOTES
+NOTES:
+  Obs_Haploid_num: <OBSERVED_HAPLOID_CHROMOSOME_COUNT>
+  Obs_Sex: <OBSERVED_SEX>
+  Interventions_per_Gb: <MANUAL_INTERVENTIONS_PER_GB>
+  Contamination_notes: "Total length of scaffolds removed: 989,717 (0.1 %)\nScaffolds removed: 1 (0.2 %)\nLargest scaffold removed: (989,717)\nFCS-GX contaminant species (number of scaffolds; total length of scaffolds):\nWolbachia endosymbiont (group B) of Melanostoma mellinum, a-proteobacteria (1; 989,717)"
+  Other_notes: "Chromosomes named by size"
diff --git a/assets/test.yaml b/assets/test.yaml
index d4da164..6a5299a 100755
--- a/assets/test.yaml
+++ b/assets/test.yaml
@@ -4,6 +4,7 @@ reference_hap2: /nfs/treeoflife-01/teams/tola/users/dp24/ascc/asccTinyTest_V2/as
 longread:
   type: hifi
   dir: /lustre/scratch123/tol/resources/treeval/treeval-testdata/TreeValSmallData/Oscheius_DF5033/genomic_data/nxOscSpes1/pacbio/fasta/
+mapped_bam: idCulLati1/mapped_bam.bam
 curationpretext:
   aligner: minimap2
   telomere_motif: TTAGG
diff --git a/conf/base.config b/conf/base.config
index 4136c84..e609a9e 100644
--- a/conf/base.config
+++ b/conf/base.config
@@ -19,6 +19,10 @@ process {
     maxRetries    = 1
     maxErrors     = '-1'
 
+    withName: "SANGER_TOL_CPRETEXT|SANGER_TOL_BTK" {
+        time    = { check_max( 70.h  * task.attempt, 'time'   ) }
+    }
+
     // Process-specific resource requirements
     // NOTE - Please try and re-use the labels below as much as possible.
     //        These labels are used and recognised by default in DSL2 files hosted on nf-core/modules.
diff --git a/conf/modules.config b/conf/modules.config
index a96a69f..137b892 100644
--- a/conf/modules.config
+++ b/conf/modules.config
@@ -12,30 +12,42 @@
 
 process {
 
-    publishDir = [
-        path: { "${params.outdir}/${task.process.tokenize(':')[-1].tokenize('_')[0].toLowerCase()}" },
-        mode: params.publish_dir_mode,
-        saveAs: { filename -> filename.equals('versions.yml') ? null : filename }
-    ]
+    withName: "GFASTATS|MERQURYFK_MERQURYFK|SANGER_TOL_BTK|SANGER_TOL_CPRETEXT" {
+        publishDir = [
+            path: { "${params.outdir}/${task.process.tokenize(':')[-1].tokenize('_')[0].toLowerCase()}" },
+            mode: params.publish_dir_mode,
+            saveAs: { filename -> filename.equals('versions.yml') ? null : filename }
+        ]
+    }
 
     withName: GFASTATS {
-        ext.args = '--nstar-report'
+        ext.args            = '--nstar-report'
     }
 
     withName: MERQURYFK_MERQURYFK {
-        ext.args        = "-P."
+        ext.args            = "-P."
     }
 
     withName: SAMTOOLS_SORT {
-        ext.prefix      = { "${meta.id}_sorted"}
+        ext.prefix          = { "${meta.id}_sorted"}
     }
 
     withName: SANGER_TOL_BTK {
-        ext.args            = "--blastx_outext 'txt'"
+        ext.pipeline_name   = "sanger-tol/blobtoolkit"
+        ext.args            = ""
         ext.executor        = "bsub -Is -tty -e test.e -o test.log -n 2 -q oversubscribed -M1400 -R'select[mem>1400] rusage[mem=1400] span[hosts=1]'"
         ext.profiles        = "singularity,sanger"
         ext.get_versions    = "lsid | head -n1 | cut -d ',' -f 1"
         ext.version         = "draft_assemblies"
     }
 
+    withName: SANGER_TOL_CPRETEXT {
+        ext.pipeline_name   = "sanger-tol/curationpretext"
+        ext.args            = ""
+        ext.executor        = "bsub -Is -tty -e test.e -o test.log -n 2 -q oversubscribed -M1400 -R'select[mem>1400] rusage[mem=1400] span[hosts=1]'"
+        ext.profiles        = "singularity,sanger"
+        ext.get_versions    = "lsid | head -n1 | cut -d ',' -f 1"
+        ext.version         = "1.0.0"
+    }
+
 }
diff --git a/conf/sanger-tol-btk.config b/conf/sanger-tol-btk.config
new file mode 100644
index 0000000..247dbbd
--- /dev/null
+++ b/conf/sanger-tol-btk.config
@@ -0,0 +1,7 @@
+process {
+    withLabel:RUN_BLASTN:BLASTN_TAXON {
+        cpus   = { check_max( 12    * task.attempt, 'cpus'    ) }
+        memory = { check_max( 10.GB * task.attempt, 'memory'  ) }
+        time   = { check_max( 16.h  * task.attempt, 'time'    ) }
+    }
+}
\ No newline at end of file
diff --git a/docs/output.md b/docs/output.md
index 335ec21..f5a9c8b 100644
--- a/docs/output.md
+++ b/docs/output.md
@@ -6,54 +6,80 @@ This document describes the output produced by the pipeline. Most of the plots a
 
 The directories listed below will be created in the results directory after the pipeline has finished. All paths are relative to the top-level results directory.
 
-<!-- TODO nf-core: Write this documentation describing your workflow's output -->
-
 ## Pipeline overview
 
 The pipeline is built using [Nextflow](https://www.nextflow.io/) and processes data using the following steps:
 
-- [FastQC](#fastqc) - Raw read QC
-- [MultiQC](#multiqc) - Aggregate report describing results and QC from the whole pipeline
+- [GFASTATS](#gfastats) - Collect statistics on the curated primary assembly
+- [MERQURYFK](#merquryfk) - Generate kmer plots for the curated assembly using previous run information
+- [SANGER_TOL_BTK](#sanger_tol_btk) - Run Blobtoolkit to generate plots and short_summary.txt from BUSCO.
+- [SANGER_TOL_CPRETEXT](#sanger_tol_cpretext) - Run Curationpretext to generate Pretext files and accessory tracks.
 - [Pipeline information](#pipeline-information) - Report metrics generated during the workflow execution
 
-### FastQC
+### GFASTATS
+
+<details markdown="1">
+<summary>Output files</summary>
+
+- `gfastats/`
+  - `*.assembly.summary`: Assembly metrics of the input primary file.
+  - `*_fasta.gz`: GZipped primary assembly file.
+
+</details>
+
+[GFASTATS](https://github.com/vgl-hub/gfastats) is a single fast and exhaustive tool for summary statistics and simultaneous *fa* (fasta, fastq, gfa [.gz]) genome assembly file manipulation.
+
+### MERQURYFK
 
 <details markdown="1">
 <summary>Output files</summary>
 
-- `fastqc/`
-  - `*_fastqc.html`: FastQC report containing quality metrics.
-  - `*_fastqc.zip`: Zip archive containing the FastQC report, tab-delimited data file and plot images.
+- `merquryfk/`
+  - `*.completeness.stats`: 
+  - `*{"primary","haplotype",""}_only.bed`:
+  - `*{"primary","haplotype",""}.qv`:
+  - `*.spectra-asm.{fl,ln,st}.png`:
+  - `*{"primary","haplotype"}.spectra-cn.{fl,ln,st}.png`:
 
 </details>
 
-[FastQC](http://www.bioinformatics.babraham.ac.uk/projects/fastqc/) gives general quality metrics about your sequenced reads. It provides information about the quality score distribution across your reads, per base sequence content (%A/T/G/C), adapter contamination and overrepresented sequences. For further reading and documentation see the [FastQC help pages](http://www.bioinformatics.babraham.ac.uk/projects/fastqc/Help/).
+[MERQURYFK](https://github.com/thegenemyers/MERQURY.FK) is a FastK based version of Merqury.
+
+Merqury is a novel tool for reference-free assembly evaluation based on efficient k-mer set operations. By comparing k-mers in a de novo assembly to those found in unassembled high-accuracy reads, Merqury estimates base-level accuracy and completeness.
+
+
+### SANGER_TOL_BTK
 
-![MultiQC - FastQC sequence counts plot](images/mqc_fastqc_counts.png)
+<details markdown="1">
+<summary>Output files</summary>
 
-![MultiQC - FastQC mean quality scores plot](images/mqc_fastqc_quality.png)
+- `sanger/*_blobtoolkit_out/`
+  - `blobtoolkit/plots/*png`: Blobtoolkit plots 
+  - `blobtoolkit/{ASSEMBLY_NAME}/*.json.gz`: Blobtoolkit dataset for use in BTK_viewer.
+  - `busco/*_odb10/*.{tsv,tar.gz,json,txt}`: Busco output
+  - `multiqc/`: MultiQC plots/data and report.html.
+  - [`pipeline_info`](#pipeline-information)
+
+</details>
 
-![MultiQC - FastQC adapter content plot](images/mqc_fastqc_adapter.png)
+[SANGER_TOL_BTK](https://pipelines.tol.sanger.ac.uk/blobtoolkit) is a bioinformatics pipeline that can be used to identify and analyse non-target DNA for eukaryotic genomes.
 
-:::note
-The FastQC plots displayed in the MultiQC report shows _untrimmed_ reads. They may contain adapter sequence and potentially regions with low quality.
-:::
 
-### MultiQC
+### SANGER_TOL_CPRETEXT
 
 <details markdown="1">
 <summary>Output files</summary>
 
-- `multiqc/`
-  - `multiqc_report.html`: a standalone HTML file that can be viewed in your web browser.
-  - `multiqc_data/`: directory containing parsed statistics from the different tools used in the pipeline.
-  - `multiqc_plots/`: directory containing static images from the report in various formats.
+- `sanger/*_curationpretext_out/`
+  - `accessory_files/*.{bigWig,bed,bedgraph}`: Track files describing Telomere, gap, coverage data across the genome. 
+  - `pretext_maps_raw`: Pre-accessory file ingestion pretext files.
+  - `pretext_maps_processed`: Post-accessory file ingestion pretext files, e.g. the final output.
+  - [`pipeline_info`](#pipeline-information)
 
 </details>
 
-[MultiQC](http://multiqc.info) is a visualization tool that generates a single HTML report summarising all samples in your project. Most of the pipeline QC results are visualised in the report and further statistics are available in the report data directory.
+[SANGER_TOL_CPRETEXT](https://pipelines.tol.sanger.ac.uk/curationpretext) is a bioinformatics pipeline typically used in conjunction with [TreeVal](https://pipelines.tol.sanger.ac.uk/treeval) to generate pretext maps (and optionally telomeric, gap, coverage, and repeat density plots which can be ingested into pretext) for the manual curation of high quality genomes.
 
-Results generated by MultiQC collate pipeline QC from supported tools e.g. FastQC. The pipeline has special steps which also allow the software versions to be reported in the MultiQC output for future traceability. For more information about how to use MultiQC reports, see <http://multiqc.info>.
 
 ### Pipeline information
 
diff --git a/docs/usage.md b/docs/usage.md
index 42521d3..b703d3e 100644
--- a/docs/usage.md
+++ b/docs/usage.md
@@ -6,60 +6,179 @@
 
 <!-- TODO nf-core: Add documentation about anything specific to running your pipeline. For general topics, please point to (and add to) the main nf-core website. -->
 
-## Samplesheet input
+## Yaml input
 
-You will need to create a samplesheet with information about the samples you would like to analyse before running the pipeline. Use this parameter to specify its location. It has to be a comma-separated file with 3 columns, and a header row as shown in the examples below.
+You will need to create a YAML file with information about the samples you would like to analyse before running the pipeline. Use this parameter to specify its location.
 
 ```bash
 --input '[path to samplesheet file]'
 ```
 
-### Multiple runs of the same sample
+The structure of this file should be as follows:
 
-The `sample` identifiers have to be the same when you have re-sequenced the same sample more than once e.g. to increase sequencing depth. The pipeline will concatenate the raw reads before performing any downstream analysis. Below is an example for the same sample sequenced across 3 lanes:
+```yaml
+# General Values for all subpipelines and modules
+assembly_id: <NAME OF ASSEMBLY>
+reference_hap1: <LOCATION OF PRIMARY ASSEMBLY FILE .FA>
+reference_hap2: <LOCATION OF HAPLOTYPE ASSEMBLY FILE .FA>
+reference_haplotigs: <LOCATION OF THE HAPLOTIGS FILE, REMOVED DURING CURATION .FA>
+
+# If a mapped bam already exists use the below + --mapped TRUE on the nextflow command else ignore it and the pipeline will create it.
+mapped_bam: <MAPPED BAM .BAM>
+
+merquryfk:
+  fastk_hist: <THE PATH TO THE .HIST FILE>
+  fastk_ktab: <PATH TO THE DIRECTORY CONTAINING THE KTAB FILES, ENSURE THE HIDDEN FILES ARE HERE TOO>
+
+# Used by both subpipelines
+longread:
+  type: <hifi|clr|ont|illumina>
+  dir: <DIRECTORY OF LONGREAD FILES .FASTA.GZ>
+curationpretext:
+  aligner: <minimap2|BWAMEM>
+  telomere_motif: <TELOMERE MOTIF OF SAMPLE>
+  hic_dir: <DIRECTORY OF HIC READ FILES .CRAM AND .CRAI>
+btk:
+  taxid: 1464561
+  lineages: <CSV LIST OF DATABASES TO USE: "insecta_odb10,diptera_odb10">
+  gca_accession: GCA_0001 <DEFAULT, DO NOT CHANGE UNLESS YOU HAVE A GCA_ACCESSION FOR YOUR SPECIES>
+  nt_database: <DIRECTORY CONTAINING BLAST DB>
+  nt_database_prefix: <BLASTDB PREFIX>
+  diamond_uniprot_database_path: <PATH TO reference_proteomes.dmnd FROM UNIPROT>
+  diamond_nr_database_path: <PATH TO nr.dmnd>
+  ncbi_taxonomy_path: <DIRECTORY CONTAINING THE TAXDUMP>
+  ncbi_rankedlineage_path: <FOLDER CONTAINING THE rankedlineage.dmp FILE>
+  config: <PATH TO ear/conf/sanger-tol-btk.config TO OVERWRITE PROCESS LIMITS>
+```
+
+## Database download and setup (Taken from sanger-tol/blobtoolkit)
+
+The BlobToolKit pipeline can be run in many different ways. The default way requires access to several databases:
+
+1. [NCBI taxdump database](https://www.ncbi.nlm.nih.gov/taxonomy)
+2. [NCBI nucleotide BLAST database](https://blast.ncbi.nlm.nih.gov/doc/blast-help/downloadblastdata.html#databases)
+3. [UniProt reference proteomes database](https://www.uniprot.org)
+4. [BUSCO database](https://busco.ezlab.org)
+
+It is a good idea to put a date suffix for each database location so you know at a glance whether you are using the latest version. We are using the `YYYY_MM` format as we do not expect the databases to be updated more frequently than once a month. However, feel free to use `DATE=YYYY_MM_DD` or a different format if you prefer.
+
+### 1. NCBI taxdump database
 
-```csv title="samplesheet.csv"
-sample,fastq_1,fastq_2
-CONTROL_REP1,AEG588A1_S1_L002_R1_001.fastq.gz,AEG588A1_S1_L002_R2_001.fastq.gz
-CONTROL_REP1,AEG588A1_S1_L003_R1_001.fastq.gz,AEG588A1_S1_L003_R2_001.fastq.gz
-CONTROL_REP1,AEG588A1_S1_L004_R1_001.fastq.gz,AEG588A1_S1_L004_R2_001.fastq.gz
+Create the database directory and move into the directory:
+
+```bash
+DATE=2023_03
+TAXDUMP=/path/to/databases/taxdump_${DATE}
+mkdir -p $TAXDUMP
+cd $TAXDUMP
 ```
 
-### Full samplesheet
+Retrieve and decompress the NCBI taxdump:
 
-The pipeline will auto-detect whether a sample is single- or paired-end using the information provided in the samplesheet. The samplesheet can have as many columns as you desire, however, there is a strict requirement for the first 3 columns to match those defined in the table below.
+```bash
+curl -L ftp://ftp.ncbi.nih.gov/pub/taxonomy/new_taxdump/new_taxdump.tar.gz | tar xzf -
+```
 
-A final samplesheet file consisting of both single- and paired-end data may look something like the one below. This is for 6 samples, where `TREATMENT_REP3` has been sequenced twice.
+### 2. NCBI nucleotide BLAST database
 
-```csv title="samplesheet.csv"
-sample,fastq_1,fastq_2
-CONTROL_REP1,AEG588A1_S1_L002_R1_001.fastq.gz,AEG588A1_S1_L002_R2_001.fastq.gz
-CONTROL_REP2,AEG588A2_S2_L002_R1_001.fastq.gz,AEG588A2_S2_L002_R2_001.fastq.gz
-CONTROL_REP3,AEG588A3_S3_L002_R1_001.fastq.gz,AEG588A3_S3_L002_R2_001.fastq.gz
-TREATMENT_REP1,AEG588A4_S4_L003_R1_001.fastq.gz,
-TREATMENT_REP2,AEG588A5_S5_L003_R1_001.fastq.gz,
-TREATMENT_REP3,AEG588A6_S6_L003_R1_001.fastq.gz,
-TREATMENT_REP3,AEG588A6_S6_L004_R1_001.fastq.gz,
+Create the database directory and move into the directory:
+
+```bash
+DATE=2023_03
+NT=/path/to/databases/nt_${DATE}
+mkdir -p $NT
+cd $NT
+```
+
+Retrieve the NCBI blast nt database (version 5) files and tar gunzip them. We are using the `&&` syntax to ensure that each command completes without error before the next one is run:
+
+```bash
+wget "ftp://ftp.ncbi.nlm.nih.gov/blast/db/v5/nt.???.tar.gz" -P $NT/ &&
+for file in $NT/*.tar.gz; do
+    tar xf $file -C $NT && rm $file;
+done
+```
+
+### 3. UniProt reference proteomes database
+
+You need [diamond blast](https://github.com/bbuchfink/diamond) installed for this step. The easiest way is probably using [conda](https://anaconda.org/bioconda/diamond). Make sure you have the latest version of Diamond (>2.x.x) otherwise the `--taxonnames` argument may not work.
+
+Create the database directory and move into the directory:
+
+```bash
+DATE=2023_03
+UNIPROT=/path/to/databases/uniprot_${DATE}
+mkdir -p $UNIPROT
+cd $UNIPROT
+```
+
+The UniProt `Refseq_Proteomes_YYYY_MM.tar.gz` file is very large (>160 GB) and will take a long time to download. The command below looks complex because it needs to get around the problem of using wildcards with wget and curl.
+
+```bash
+wget -q -O $UNIPROT/reference_proteomes.tar.gz \
+  ftp.ebi.ac.uk/pub/databases/uniprot/current_release/knowledgebase/reference_proteomes/$(curl \
+    -vs ftp.ebi.ac.uk/pub/databases/uniprot/current_release/knowledgebase/reference_proteomes/ 2>&1 | \
+    awk '/tar.gz/ {print $9}')
+tar xf reference_proteomes.tar.gz
+
+# Create a single fasta file with all the fasta files from each subdirectory:
+touch reference_proteomes.fasta.gz
+find . -mindepth 2 | grep "fasta.gz" | grep -v 'DNA' | grep -v 'additional' | xargs cat >> reference_proteomes.fasta.gz
+
+# create the accession-to-taxid map for all reference proteome sequences:
+printf "accession\taccession.version\ttaxid\tgi\n" > reference_proteomes.taxid_map
+zcat */*/*.idmapping.gz | grep "NCBI_TaxID" | awk '{print $1 "\t" $1 "\t" $3 "\t" 0}' >> reference_proteomes.taxid_map
+
+# create the taxon aware diamond blast database
+diamond makedb -p 16 --in reference_proteomes.fasta.gz --taxonmap reference_proteomes.taxid_map --taxonnodes $TAXDUMP/nodes.dmp --taxonnames $TAXDUMP/names.dmp -d reference_proteomes.dmnd
 ```
 
-| Column    | Description                                                                                                                                                                            |
-| --------- | -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| `sample`  | Custom sample name. This entry will be identical for multiple sequencing libraries/runs from the same sample. Spaces in sample names are automatically converted to underscores (`_`). |
-| `fastq_1` | Full path to FastQ file for Illumina short reads 1. File has to be gzipped and have the extension ".fastq.gz" or ".fq.gz".                                                             |
-| `fastq_2` | Full path to FastQ file for Illumina short reads 2. File has to be gzipped and have the extension ".fastq.gz" or ".fq.gz".                                                             |
+### 4. BUSCO databases
+
+Create the database directory and move into the directory:
+
+```bash
+DATE=2023_03
+BUSCO=/path/to/databases/busco_${DATE}
+mkdir -p $BUSCO
+cd $BUSCO
+```
+
+Download BUSCO data and lineages to allow BUSCO to run in offline mode:
+
+```bash
+wget -r -nH https://busco-data.ezlab.org/v5/data/
+# the trailing slash after data is important. Otherwise wget doesn't get the subdirectories
+
+# tar gunzip all folders that have been stored as tar.gz, in the same parent directories as where they were stored:
+find v5/data -name "*.tar.gz" | while read -r TAR; do tar -C `dirname $TAR` -xzf $TAR; done
+```
+
+If you have [GNU parallel](https://www.gnu.org/software/parallel/) installed, you can also use the command below which will run faster as it will run the decompression commands in parallel:
+
+```bash
+find v5/data -name "*.tar.gz" | parallel "cd {//}; tar -xzf {/}"
+```
+
+## Blobtoolkit - YAML File and Nextflow configuration
+
+As in the Snakemake version [a YAML configuration file](https://github.com/blobtoolkit/blobtoolkit/tree/main/src/blobtoolkit-pipeline/src#configuration) is needed to generate metadata summary. This YAML config file can be generated with a genome accession value for released assemblies (for example, GCA_XXXXXXXXX.X) or can be passed for draft assemblies (for example, [GCA_922984935.2.yaml](assets/test/GCA_922984935.2.yaml)) using the `--yaml` parameter. Even for draft assemblies, a placeholder value should be passed with the `--accession` parameter.
+
+The data in the YAML is currently ignored in the Nextflow pipeline version. The YAML file is retained only to allow compatibility with the BlobDir dataset generated by the [Snakemake version](https://github.com/blobtoolkit/blobtoolkit/tree/main/src/blobtoolkit-pipeline/src). The taxonomic information in the YAML file can be obtained from [NCBI Taxonomy](https://www.ncbi.nlm.nih.gov/data-hub/taxonomy/).
 
-An [example samplesheet](../assets/samplesheet.csv) has been provided with the pipeline.
 
 ## Running the pipeline
 
 The typical command for running the pipeline is as follows:
 
 ```bash
-nextflow run sanger-tol/ear --input ./samplesheet.csv --outdir ./results --genome GRCh37 -profile docker
+nextflow run sanger-tol/ear --input assets/test.yaml --outdir ./results  -profile docker
 ```
 
 This will launch the pipeline with the `docker` configuration profile. See below for more information about profiles.
 
+> Please note that conda is not supported for all tools used by this pipeline; this limits use to docker or singularity.
+
 Note that the pipeline will create the following files in your working directory:
 
 ```bash
@@ -77,23 +196,6 @@ Pipeline settings can be provided in a `yaml` or `json` file via `-params-file <
 Do not use `-c <file>` to specify parameters as this will result in errors. Custom config files specified with `-c` must only be used for [tuning process resource specifications](https://nf-co.re/docs/usage/configuration#tuning-workflow-resources), other infrastructural tweaks (such as output directories), or module arguments (args).
 :::
 
-The above pipeline run specified with a params file in yaml format:
-
-```bash
-nextflow run sanger-tol/ear -profile docker -params-file params.yaml
-```
-
-with `params.yaml` containing:
-
-```yaml
-input: './samplesheet.csv'
-outdir: './results/'
-genome: 'GRCh37'
-<...>
-```
-
-You can also generate such `YAML`/`JSON` files via [nf-core/launch](https://nf-co.re/launch).
-
 ### Updating the pipeline
 
 When you run the above command, Nextflow automatically pulls the pipeline code from GitHub and stores it as a cached version. When running the pipeline after this, it will always use the cached version if available - even if the pipeline has been updated since. To make sure that you're running the latest version of the pipeline, make sure that you regularly update the cached version of the pipeline:
diff --git a/main.nf b/main.nf
index 3b7bca7..1e4ece0 100644
--- a/main.nf
+++ b/main.nf
@@ -29,7 +29,7 @@ include { EAR  } from './workflows/ear'
 workflow SANGERTOL_EAR {
 
     take:
-    samplesheet // channel: samplesheet read in from --input
+    input_yaml // channel: input_yaml read in from --input
 
     main:
 
@@ -37,7 +37,7 @@ workflow SANGERTOL_EAR {
     // WORKFLOW: Run pipeline
     //
     EAR (
-        samplesheet
+        input_yaml
     )
 
 
diff --git a/modules.json b/modules.json
index 3b0db89..23ee7d4 100644
--- a/modules.json
+++ b/modules.json
@@ -5,45 +5,41 @@
         "https://github.com/nf-core/modules.git": {
             "modules": {
                 "nf-core": {
-                    "busco/busco": {
-                        "branch": "master",
-                        "git_sha": "17486961b8b1ab1aae258c83a7e947b40d8ab670",
-                        "installed_by": ["modules"]
-                    },
-                    "fastqc": {
-                        "branch": "master",
-                        "git_sha": "285a50500f9e02578d90b3ce6382ea3c30216acd",
-                        "installed_by": ["modules"]
-                    },
                     "gfastats": {
                         "branch": "master",
                         "git_sha": "3f5420aa22e00bd030a2556dfdffc9e164ec0ec5",
-                        "installed_by": ["modules"]
+                        "installed_by": [
+                            "modules"
+                        ]
                     },
                     "merquryfk/merquryfk": {
                         "branch": "master",
                         "git_sha": "3f5420aa22e00bd030a2556dfdffc9e164ec0ec5",
-                        "installed_by": ["modules"]
+                        "installed_by": [
+                            "modules"
+                        ],
+                        "patch": "modules/nf-core/merquryfk/merquryfk/merquryfk-merquryfk.diff"
                     },
                     "minimap2/align": {
                         "branch": "master",
                         "git_sha": "a33ef9475558c6b8da08c5f522ddaca1ec810306",
-                        "installed_by": ["modules"]
-                    },
-                    "multiqc": {
-                        "branch": "master",
-                        "git_sha": "b7ebe95761cd389603f9cc0e0dc384c0f663815a",
-                        "installed_by": ["modules"]
+                        "installed_by": [
+                            "modules"
+                        ]
                     },
                     "samtools/merge": {
                         "branch": "master",
                         "git_sha": "04fbbc7c43cebc0b95d5b126f6d9fe4effa33519",
-                        "installed_by": ["modules"]
+                        "installed_by": [
+                            "modules"
+                        ]
                     },
                     "samtools/sort": {
                         "branch": "master",
                         "git_sha": "46eca555142d6e597729fcb682adcc791796f514",
-                        "installed_by": ["modules"]
+                        "installed_by": [
+                            "modules"
+                        ]
                     }
                 }
             },
@@ -52,20 +48,26 @@
                     "utils_nextflow_pipeline": {
                         "branch": "master",
                         "git_sha": "5caf7640a9ef1d18d765d55339be751bb0969dfa",
-                        "installed_by": ["subworkflows"]
+                        "installed_by": [
+                            "subworkflows"
+                        ]
                     },
                     "utils_nfcore_pipeline": {
                         "branch": "master",
                         "git_sha": "92de218a329bfc9a9033116eb5f65fd270e72ba3",
-                        "installed_by": ["subworkflows"]
+                        "installed_by": [
+                            "subworkflows"
+                        ]
                     },
                     "utils_nfvalidation_plugin": {
                         "branch": "master",
                         "git_sha": "5caf7640a9ef1d18d765d55339be751bb0969dfa",
-                        "installed_by": ["subworkflows"]
+                        "installed_by": [
+                            "subworkflows"
+                        ]
                     }
                 }
             }
         }
     }
-}
+}
\ No newline at end of file
diff --git a/modules/local/sanger_tol_btk.nf b/modules/local/sanger_tol_btk.nf
index 27e3ca0..6ce9191 100644
--- a/modules/local/sanger_tol_btk.nf
+++ b/modules/local/sanger_tol_btk.nf
@@ -7,46 +7,49 @@ process SANGER_TOL_BTK {
     tuple val(meta1), path(bam) // Name needs to remain the same as previous process as they are referenced in the samplesheet
     tuple val(meta2), path(samplesheet_csv, stageAs: "SAMPLESHEET.csv")
     path blastp, stageAs: "blastp.dmnd"
-    path blastn
+    path blastn, stageAs: ""
     path blastx
-    path btk_config_file
+    path config_file
     path tax_dump
-    path btk_yaml, stageAs: "BTK.yaml"
     val busco_lineages
     val taxon
     val gca_accession
 
     output:
-    tuple val(meta), path("${meta.id}_btk_out/blobtoolkit/REFERENCE"),      emit: dataset
-    path("${meta.id}_btk_out/blobtoolkit/plots"),                           emit: plots
-    path("${meta.id}_btk_out/blobtoolkit/REFERENCE/summary.json.gz"),     emit: summary_json
-    path("${meta.id}_btk_out/busco"),                                       emit: busco_data
-    path("${meta.id}_btk_out/multiqc"),                                     emit: multiqc_report
-    path("blobtoolkit_pipeline_info"),                                      emit: pipeline_info
-    path "versions.yml",                                                    emit: versions
+    tuple val(meta), path("*_out/blobtoolkit/REFERENCE"),      emit: dataset
+    path("*_out/blobtoolkit/plots"),                           emit: plots
+    path("*_out/blobtoolkit/REFERENCE/summary.json.gz"),       emit: summary_json
+    path("*_out/busco"),                                       emit: busco_data
+    path("*_out/multiqc"),                                     emit: multiqc_report
+    path("*_out/blobtoolkit_pipeline_info"),                   emit: pipeline_info
+    path "versions.yml",                                       emit: versions
 
     script:
-    def args                =   task.ext.args           ?:  ""
-    def executor            =   task.ext.executor       ?:  ""
-    def profiles            =   task.ext.profiles       ?:  ""
-    def get_version         =   task.ext.version_data   ?:  "UNKNOWN - SETTING NOT SET"
-    def btk_config          =   btk_config_file         ? "-c $btk_config_file"         : ""
-    def pipeline_version    =   task.ext.version        ?: "draft_assemblies"
-    // YAML used to avoid the use of GCA accession number
-    //    https://github.com/sanger-tol/blobtoolkit/issues/77
+    def pipeline_name                       =   task.ext.pipeline_name
+    def (pipeline_prefix,pipeline_suffix)   =   pipeline_name.split('/')
+    def output_dir                          =   "${meta.id}_${pipeline_suffix}_out"
+    def args                                =   task.ext.args           ?:  ""
+    def executor                            =   task.ext.executor       ?:  ""
+    def profiles                            =   task.ext.profiles       ?:  ""
+    def get_version                         =   task.ext.version_data   ?:  "UNKNOWN - SETTING NOT SET"
+    def config                              =   config_file             ? "-c $config_file"         : ""
+    def pipeline_version                    =   task.ext.version        ?: "main"
 
     // Seems to be an issue where a nested pipeline can't see the files in the same directory
     // Running realpath gets around this but the files copied into the folder are
     // now just wasted space. Should be fixed with using Mahesh's method of nesting but
     // this is proving a bit complicated with BTK
 
-    // outdir should be an arg
-
     // blastx and blastp can use the same database hence the StageAs
 
+    // Running these as unique jobs means we don't have to worry about multiple pipeline
+    // head jobs running in the same initial Nextflow head, this balloons memory
+    // for LSF we can use -Is -tty to keep the output of this sub-pipeline in
+    // terminal, keeping the job open until the pipeline completes
 
+    // the final command of the script appends the sub-pipeline's versions file to this task's versions.yml
     """
-    $executor 'nextflow run sanger-tol/blobtoolkit \\
+    $executor 'nextflow run $pipeline_name \\
         -r $pipeline_version \\
         -profile  $profiles \\
         --input "\$(realpath $samplesheet_csv)" \\
@@ -58,10 +61,9 @@ process SANGER_TOL_BTK {
         --blastp "\$(realpath blastp.dmnd)" \\
         --blastn "\$(realpath $blastn)" \\
         --blastx "\$(realpath $blastx)" \\
-        $btk_config \\
-        $args'
-
-    mv ${meta.id}_btk_out/pipeline_info blobtoolkit_pipeline_info
+        $config \\
+        $args \\
+        -resume'
 
     cat <<-END_VERSIONS > versions.yml
     "${task.process}":
@@ -69,10 +71,12 @@ process SANGER_TOL_BTK {
         Nextflow: \$(nextflow -v | cut -d " " -f3)
         executor system: $get_version
     END_VERSIONS
+    # Append the nested pipeline's versions file (printf never reads stdin, so it only wrote a literal "/t")
+    cat ${output_dir}/pipeline_info/software_version.yml >> versions.yml
     """
 
     stub:
-    def pipeline_version    =   task.ext.version        ?: "draft_assemblies"
+    def pipeline_version    =   task.ext.version        ?: "main"
 
     """
     mkdir -p ${meta.id}_btk_out/blobtoolkit/${meta.id}_out
diff --git a/modules/local/sanger_tol_cpretext.nf b/modules/local/sanger_tol_cpretext.nf
new file mode 100644
index 0000000..5b986e1
--- /dev/null
+++ b/modules/local/sanger_tol_cpretext.nf
@@ -0,0 +1,83 @@
+process SANGER_TOL_CPRETEXT {
+    // Launches the nested pipeline named by `task.ext.pipeline_name` on `reference` and
+    // emits everything that run writes under its --outdir, plus a versions.yml for this task.
+    tag "$reference"
+    label 'process_low'
+
+    input:
+    path(reference)     // forwarded to the nested pipeline as --input
+    path(longread_dir)  // forwarded as --longread
+    path(cram_dir)      // forwarded as --cram
+    path(config_file)   // optional extra Nextflow config, forwarded with -c when provided
+
+    output:
+    tuple val(reference), path("*_out/*"),  emit: dataset
+    path "versions.yml",                    emit: versions
+
+    script:
+    // "<org>/<pipeline>"; the part after the slash names the output directory and the versions key.
+    def pipeline_name       =   task.ext.pipeline_name      ?:  "sanger-tol/curationpretext"
+    def pipeline_suffix     =   pipeline_name.tokenize('/').last()
+    def output_dir          =   "${reference}_${pipeline_suffix}_out"
+    def args                =   task.ext.args               ?:  ""
+    // The nested command is handed to the launcher as ONE single-quoted string, so a launcher
+    // must always be present; `bash -c` runs it in place when no scheduler wrapper is configured.
+    def executor            =   task.ext.executor           ?:  "bash -c"
+    def profiles            =   task.ext.profiles           ?:  ""
+    def get_version         =   task.ext.version_data       ?:  "UNKNOWN - SETTING NOT SET"
+    def config              =   config_file                 ?   "-c $config_file"   :   ""
+    def pipeline_version    =   task.ext.version            ?:  "main"
+
+    // Seems to be an issue where a nested pipeline can't see the files in the same directory.
+    // Running realpath gets around this but the files copied into the folder are
+    // now just wasted space.
+
+    // Running these as unique jobs means we don't have to worry about multiple pipeline
+    // head jobs running in the same initial Nextflow head, this balloons memory
+    // for LSF we can use -Is -tty to keep the output of this sub-pipeline in
+    // terminal, keeping the job open until the pipeline completes
+
+    // The final `cat` appends the sub-pipeline's versions file to this task's versions.yml.
+    // NOTE(review): nf-core pipelines usually publish `software_versions.yml` (plural) - confirm
+    // the file name written by the nested pipeline.
+    """
+    $executor 'nextflow run $pipeline_name \\
+        -r $pipeline_version \\
+        -profile  $profiles \\
+        --input "\$(realpath $reference)" \\
+        --outdir $output_dir \\
+        --longread "\$(realpath $longread_dir)" \\
+        --cram "\$(realpath $cram_dir)" \\
+        $args \\
+        $config \\
+        -resume'
+
+    cat <<-END_VERSIONS > versions.yml
+    "${task.process}":
+        $pipeline_suffix: $pipeline_version
+        Nextflow: \$(nextflow -v | cut -d " " -f3)
+        executor system: $get_version
+    END_VERSIONS
+
+    cat ${output_dir}/pipeline_info/software_version.yml >> versions.yml
+    """
+
+    stub:
+    // The stub is evaluated separately from `script:`, so every variable used below is declared here.
+    def pipeline_name       =   task.ext.pipeline_name      ?:  "sanger-tol/curationpretext"
+    def pipeline_suffix     =   pipeline_name.tokenize('/').last()
+    def output_dir          =   "${reference}_${pipeline_suffix}_out"
+    def get_version         =   task.ext.version_data       ?:  "UNKNOWN - SETTING NOT SET"
+    def pipeline_version    =   task.ext.version            ?:  "main"
+    """
+    mkdir -p ${output_dir}
+    touch ${output_dir}/reference.txt
+
+    cat <<-END_VERSIONS > versions.yml
+    "${task.process}":
+        $pipeline_suffix: $pipeline_version
+        Nextflow: \$(nextflow -v | cut -d " " -f3)
+        executor system: $get_version
+    END_VERSIONS
+    """
+}
diff --git a/modules/nf-core/busco/busco/environment.yml b/modules/nf-core/busco/busco/environment.yml
deleted file mode 100644
index 06a5d93..0000000
--- a/modules/nf-core/busco/busco/environment.yml
+++ /dev/null
@@ -1,7 +0,0 @@
-name: busco_busco
-channels:
-  - conda-forge
-  - bioconda
-  - defaults
-dependencies:
-  - bioconda::busco=5.7.1
diff --git a/modules/nf-core/busco/busco/main.nf b/modules/nf-core/busco/busco/main.nf
deleted file mode 100644
index f7c1a66..0000000
--- a/modules/nf-core/busco/busco/main.nf
+++ /dev/null
@@ -1,107 +0,0 @@
-process BUSCO_BUSCO {
-    tag "$meta.id"
-    label 'process_medium'
-
-    conda "${moduleDir}/environment.yml"
-    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
-        'https://depot.galaxyproject.org/singularity/busco:5.7.1--pyhdfd78af_0':
-        'biocontainers/busco:5.7.1--pyhdfd78af_0' }"
-
-    input:
-    tuple val(meta), path(fasta, stageAs:'tmp_input/*')
-    val mode                              // Required:    One of genome, proteins, or transcriptome
-    val lineage                           // Required:    lineage to check against, "auto" enables --auto-lineage instead
-    path busco_lineages_path              // Recommended: path to busco lineages - downloads if not set
-    path config_file                      // Optional:    busco configuration file
-
-    output:
-    tuple val(meta), path("*-busco.batch_summary.txt")                , emit: batch_summary
-    tuple val(meta), path("short_summary.*.txt")                      , emit: short_summaries_txt   , optional: true
-    tuple val(meta), path("short_summary.*.json")                     , emit: short_summaries_json  , optional: true
-    tuple val(meta), path("*-busco/*/run_*/full_table.tsv")           , emit: full_table            , optional: true
-    tuple val(meta), path("*-busco/*/run_*/missing_busco_list.tsv")   , emit: missing_busco_list    , optional: true
-    tuple val(meta), path("*-busco/*/run_*/single_copy_proteins.faa") , emit: single_copy_proteins  , optional: true
-    tuple val(meta), path("*-busco/*/run_*/busco_sequences")          , emit: seq_dir
-    tuple val(meta), path("*-busco/*/translated_proteins")            , emit: translated_dir        , optional: true
-    tuple val(meta), path("*-busco")                                  , emit: busco_dir
-    path "versions.yml"                                               , emit: versions
-
-    when:
-    task.ext.when == null || task.ext.when
-
-    script:
-    if ( mode !in [ 'genome', 'proteins', 'transcriptome' ] ) {
-        error "Mode must be one of 'genome', 'proteins', or 'transcriptome'."
-    }
-    def args = task.ext.args ?: ''
-    def prefix = task.ext.prefix ?: "${meta.id}-${lineage}"
-    def busco_config = config_file ? "--config $config_file" : ''
-    def busco_lineage = lineage.equals('auto') ? '--auto-lineage' : "--lineage_dataset ${lineage}"
-    def busco_lineage_dir = busco_lineages_path ? "--download_path ${busco_lineages_path}" : ''
-    """
-    # Nextflow changes the container --entrypoint to /bin/bash (container default entrypoint: /usr/local/env-execute)
-    # Check for container variable initialisation script and source it.
-    if [ -f "/usr/local/env-activate.sh" ]; then
-        set +u  # Otherwise, errors out because of various unbound variables
-        . "/usr/local/env-activate.sh"
-        set -u
-    fi
-
-    # If the augustus config directory is not writable, then copy to writeable area
-    if [ ! -w "\${AUGUSTUS_CONFIG_PATH}" ]; then
-        # Create writable tmp directory for augustus
-        AUG_CONF_DIR=\$( mktemp -d -p \$PWD )
-        cp -r \$AUGUSTUS_CONFIG_PATH/* \$AUG_CONF_DIR
-        export AUGUSTUS_CONFIG_PATH=\$AUG_CONF_DIR
-        echo "New AUGUSTUS_CONFIG_PATH=\${AUGUSTUS_CONFIG_PATH}"
-    fi
-
-    # Ensure the input is uncompressed
-    INPUT_SEQS=input_seqs
-    mkdir "\$INPUT_SEQS"
-    cd "\$INPUT_SEQS"
-    for FASTA in ../tmp_input/*; do
-        if [ "\${FASTA##*.}" == 'gz' ]; then
-            gzip -cdf "\$FASTA" > \$( basename "\$FASTA" .gz )
-        else
-            ln -s "\$FASTA" .
-        fi
-    done
-    cd ..
-
-    busco \\
-        --cpu $task.cpus \\
-        --in "\$INPUT_SEQS" \\
-        --out ${prefix}-busco \\
-        --mode $mode \\
-        $busco_lineage \\
-        $busco_lineage_dir \\
-        $busco_config \\
-        $args
-
-    # clean up
-    rm -rf "\$INPUT_SEQS"
-
-    # Move files to avoid staging/publishing issues
-    mv ${prefix}-busco/batch_summary.txt ${prefix}-busco.batch_summary.txt
-    mv ${prefix}-busco/*/short_summary.*.{json,txt} . || echo "Short summaries were not available: No genes were found."
-
-    cat <<-END_VERSIONS > versions.yml
-    "${task.process}":
-        busco: \$( busco --version 2>&1 | sed 's/^BUSCO //' )
-    END_VERSIONS
-    """
-
-    stub:
-    def prefix      = task.ext.prefix ?: "${meta.id}-${lineage}"
-    def fasta_name  = files(fasta).first().name - '.gz'
-    """
-    touch ${prefix}-busco.batch_summary.txt
-    mkdir -p ${prefix}-busco/$fasta_name/run_${lineage}/busco_sequences
-
-    cat <<-END_VERSIONS > versions.yml
-    "${task.process}":
-        busco: \$( busco --version 2>&1 | sed 's/^BUSCO //' )
-    END_VERSIONS
-    """
-}
diff --git a/modules/nf-core/busco/busco/meta.yml b/modules/nf-core/busco/busco/meta.yml
deleted file mode 100644
index 29745d2..0000000
--- a/modules/nf-core/busco/busco/meta.yml
+++ /dev/null
@@ -1,98 +0,0 @@
-name: busco_busco
-description: Benchmarking Universal Single Copy Orthologs
-keywords:
-  - quality control
-  - genome
-  - transcriptome
-  - proteome
-tools:
-  - busco:
-      description: BUSCO provides measures for quantitative assessment of genome assembly, gene set, and transcriptome completeness based on evolutionarily informed expectations of gene content from near-universal single-copy orthologs selected from OrthoDB.
-      homepage: https://busco.ezlab.org/
-      documentation: https://busco.ezlab.org/busco_userguide.html
-      tool_dev_url: https://gitlab.com/ezlab/busco
-      doi: "10.1007/978-1-4939-9173-0_14"
-      licence: ["MIT"]
-input:
-  - meta:
-      type: map
-      description: |
-        Groovy Map containing sample information
-        e.g. [ id:'test', single_end:false ]
-  - fasta:
-      type: file
-      description: Nucleic or amino acid sequence file in FASTA format.
-      pattern: "*.{fasta,fna,fa,fasta.gz,fna.gz,fa.gz}"
-  - mode:
-      type: string
-      description: The mode to run Busco in. One of genome, proteins, or transcriptome
-      pattern: "{genome,proteins,transcriptome}"
-  - lineage:
-      type: string
-      description: The BUSCO lineage to use, or "auto" to automatically select lineage
-  - busco_lineages_path:
-      type: directory
-      description: Path to local BUSCO lineages directory.
-  - config_file:
-      type: file
-      description: Path to BUSCO config file.
-output:
-  - meta:
-      type: map
-      description: |
-        Groovy Map containing sample information
-        e.g. [ id:'test', single_end:false ]
-  - batch_summary:
-      type: file
-      description: Summary of all sequence files analyzed
-      pattern: "*-busco.batch_summary.txt"
-  - short_summaries_txt:
-      type: file
-      description: Short Busco summary in plain text format
-      pattern: "short_summary.*.txt"
-  - short_summaries_json:
-      type: file
-      description: Short Busco summary in JSON format
-      pattern: "short_summary.*.json"
-  - busco_dir:
-      type: directory
-      description: BUSCO lineage specific output
-      pattern: "*-busco"
-  - full_table:
-      type: file
-      description: Full BUSCO results table
-      pattern: "full_table.tsv"
-  - missing_busco_list:
-      type: file
-      description: List of missing BUSCOs
-      pattern: "missing_busco_list.tsv"
-  - single_copy_proteins:
-      type: file
-      description: Fasta file of single copy proteins (transcriptome mode)
-      pattern: "single_copy_proteins.faa"
-  - seq_dir:
-      type: directory
-      description: BUSCO sequence directory
-      pattern: "busco_sequences"
-  - translated_dir:
-      type: directory
-      description: Six frame translations of each transcript made by the transcriptome mode
-      pattern: "translated_dir"
-  - versions:
-      type: file
-      description: File containing software versions
-      pattern: "versions.yml"
-authors:
-  - "@priyanka-surana"
-  - "@charles-plessy"
-  - "@mahesh-panchal"
-  - "@muffato"
-  - "@jvhagey"
-  - "@gallvp"
-maintainers:
-  - "@priyanka-surana"
-  - "@charles-plessy"
-  - "@mahesh-panchal"
-  - "@muffato"
-  - "@jvhagey"
-  - "@gallvp"
diff --git a/modules/nf-core/busco/busco/tests/main.nf.test b/modules/nf-core/busco/busco/tests/main.nf.test
deleted file mode 100644
index 16b708b..0000000
--- a/modules/nf-core/busco/busco/tests/main.nf.test
+++ /dev/null
@@ -1,419 +0,0 @@
-nextflow_process {
-
-    name "Test Process BUSCO_BUSCO"
-    script "../main.nf"
-    process "BUSCO_BUSCO"
-
-    tag "modules"
-    tag "modules_nfcore"
-    tag "busco"
-    tag "busco/busco"
-
-    test("test_busco_genome_single_fasta") {
-
-        config './nextflow.config'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    file( params.test_data['bacteroides_fragilis']['genome']['genome_fna_gz'], checkIfExists: true)
-                ]
-                input[1] = 'genome'
-                input[2] = 'bacteria_odb10' // Launch with 'auto' to use --auto-lineage, and specified lineages // 'auto' removed from test due to memory issues
-                input[3] = [] // Download busco lineage
-                input[4] = [] // No config
-                """
-            }
-        }
-
-        then {
-            assert process.success
-
-            with(path(process.out.short_summaries_txt[0][1]).text) {
-                assert contains('BUSCO version')
-                assert contains('The lineage dataset is')
-                assert contains('BUSCO was run in mode')
-                assert contains('Complete BUSCOs')
-                assert contains('Missing BUSCOs')
-                assert contains('Dependencies and versions')
-            }
-
-            with(path(process.out.short_summaries_json[0][1]).text) {
-                assert contains('one_line_summary')
-                assert contains('mode')
-                assert contains('dataset')
-            }
-
-            assert snapshot(
-                    process.out.batch_summary[0][1],
-                    process.out.full_table[0][1],
-                    process.out.missing_busco_list[0][1],
-                    process.out.versions[0]
-                ).match()
-
-            with(file(process.out.seq_dir[0][1]).listFiles().collect { it.name }) {
-                assert contains('single_copy_busco_sequences.tar.gz')
-                assert contains('multi_copy_busco_sequences.tar.gz')
-                assert contains('fragmented_busco_sequences.tar.gz')
-            }
-
-            with(path("${process.out.busco_dir[0][1]}/logs/busco.log").text) {
-                assert contains('DEBUG:busco.run_BUSCO')
-                assert contains('Results from dataset')
-                assert contains('how to cite BUSCO')
-            }
-
-            assert process.out.single_copy_proteins == []
-            assert process.out.translated_dir == []
-        }
-    }
-
-    test("test_busco_genome_multi_fasta") {
-
-        config './nextflow.config'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    [
-                        file( params.test_data['bacteroides_fragilis']['genome']['genome_fna_gz'], checkIfExists: true),
-                        file( params.test_data['candidatus_portiera_aleyrodidarum']['genome']['genome_fasta'], checkIfExists: true)
-                    ]
-                ]
-                input[1] = 'genome'
-                input[2] = 'bacteria_odb10'
-                input[3] = []
-                input[4] = []
-                """
-            }
-        }
-
-        then {
-            assert process.success
-
-            with(path(process.out.short_summaries_txt[0][1][0]).text) {
-                assert contains('BUSCO version')
-                assert contains('The lineage dataset is')
-                assert contains('BUSCO was run in mode')
-                assert contains('Complete BUSCOs')
-                assert contains('Missing BUSCOs')
-                assert contains('Dependencies and versions')
-            }
-
-            with(path(process.out.short_summaries_txt[0][1][1]).text) {
-                assert contains('BUSCO version')
-                assert contains('The lineage dataset is')
-                assert contains('BUSCO was run in mode')
-                assert contains('Complete BUSCOs')
-                assert contains('Missing BUSCOs')
-                assert contains('Dependencies and versions')
-            }
-
-            with(path(process.out.short_summaries_json[0][1][0]).text) {
-                assert contains('one_line_summary')
-                assert contains('mode')
-                assert contains('dataset')
-            }
-
-            with(path(process.out.short_summaries_json[0][1][1]).text) {
-                assert contains('one_line_summary')
-                assert contains('mode')
-                assert contains('dataset')
-            }
-
-            assert snapshot(
-                    process.out.batch_summary[0][1],
-                    process.out.full_table[0][1],
-                    process.out.missing_busco_list[0][1],
-                    process.out.versions[0]
-                ).match()
-
-            with(file(process.out.seq_dir[0][1][0]).listFiles().collect { it.name }) {
-                assert contains('single_copy_busco_sequences.tar.gz')
-                assert contains('multi_copy_busco_sequences.tar.gz')
-                assert contains('fragmented_busco_sequences.tar.gz')
-            }
-
-            with(file(process.out.seq_dir[0][1][1]).listFiles().collect { it.name }) {
-                assert contains('single_copy_busco_sequences.tar.gz')
-                assert contains('multi_copy_busco_sequences.tar.gz')
-                assert contains('fragmented_busco_sequences.tar.gz')
-            }
-
-            with(path("${process.out.busco_dir[0][1]}/logs/busco.log").text) {
-                assert contains('DEBUG:busco.run_BUSCO')
-                assert contains('Results from dataset')
-                assert contains('how to cite BUSCO')
-            }
-
-            assert process.out.single_copy_proteins == []
-            assert process.out.translated_dir == []
-        }
-
-    }
-
-    test("test_busco_eukaryote_metaeuk") {
-
-        config './nextflow.metaeuk.config'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    file( params.test_data['homo_sapiens']['genome']['genome_fasta'], checkIfExists: true)
-                ]
-                input[1] = 'genome'
-                input[2] = 'eukaryota_odb10'
-                input[3] = []
-                input[4] = []
-                """
-            }
-        }
-
-        then {
-            assert process.success
-
-            with(path(process.out.short_summaries_txt[0][1]).text) {
-                assert contains('BUSCO version')
-                assert contains('The lineage dataset is')
-                assert contains('BUSCO was run in mode')
-                assert contains('Complete BUSCOs')
-                assert contains('Missing BUSCOs')
-                assert contains('Dependencies and versions')
-            }
-
-            with(path(process.out.short_summaries_json[0][1]).text) {
-                assert contains('one_line_summary')
-                assert contains('mode')
-                assert contains('dataset')
-            }
-
-            assert snapshot(
-                    process.out.batch_summary[0][1],
-                    process.out.full_table[0][1],
-                    process.out.missing_busco_list[0][1],
-                    process.out.versions[0]
-                ).match()
-
-            with(file(process.out.seq_dir[0][1]).listFiles().collect { it.name }) {
-                assert contains('single_copy_busco_sequences.tar.gz')
-                assert contains('multi_copy_busco_sequences.tar.gz')
-                assert contains('fragmented_busco_sequences.tar.gz')
-            }
-
-            with(path("${process.out.busco_dir[0][1]}/logs/busco.log").text) {
-                assert contains('DEBUG:busco.run_BUSCO')
-                assert contains("'use_augustus', 'False'")
-                assert contains("'use_metaeuk', 'True'") // METAEUK
-                assert contains('Results from dataset')
-                assert contains('how to cite BUSCO')
-
-            }
-
-            assert process.out.single_copy_proteins == []
-            assert process.out.translated_dir == []
-        }
-
-    }
-
-    test("test_busco_eukaryote_augustus") {
-
-        config './nextflow.augustus.config'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    file( params.test_data['homo_sapiens']['genome']['genome_fasta'], checkIfExists: true)
-                ]
-                input[1] = 'genome'
-                input[2] = 'eukaryota_odb10'
-                input[3] = []
-                input[4] = []
-                """
-            }
-        }
-
-        then {
-            assert process.success
-
-            assert snapshot(
-                    process.out.batch_summary[0][1],
-                    process.out.versions[0]
-                ).match()
-
-            with(path("${process.out.busco_dir[0][1]}/logs/busco.log").text) {
-                assert contains('DEBUG:busco.run_BUSCO')
-                assert contains("'use_augustus', 'True'")
-                assert contains("'use_metaeuk', 'False'") // AUGUSTUS
-                assert contains('Augustus did not recognize any genes')
-
-            }
-
-            assert process.out.short_summaries_json == []
-            assert process.out.short_summaries_txt == []
-            assert process.out.missing_busco_list == []
-            assert process.out.full_table == []
-            assert process.out.single_copy_proteins == []
-            assert process.out.translated_dir == []
-        }
-
-    }
-
-    test("test_busco_protein") {
-
-        config './nextflow.config'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    file( params.test_data['candidatus_portiera_aleyrodidarum']['genome']['proteome_fasta'], checkIfExists: true)
-                ]
-                input[1] = 'proteins'
-                input[2] = 'bacteria_odb10'
-                input[3] = []
-                input[4] = []
-                """
-            }
-        }
-
-        then {
-            assert process.success
-
-            with(path(process.out.short_summaries_txt[0][1]).text) {
-                assert contains('BUSCO version')
-                assert contains('The lineage dataset is')
-                assert contains('BUSCO was run in mode')
-                assert contains('Complete BUSCOs')
-                assert contains('Missing BUSCOs')
-                assert contains('Dependencies and versions')
-            }
-
-            with(path(process.out.short_summaries_json[0][1]).text) {
-                assert contains('one_line_summary')
-                assert contains('mode')
-                assert contains('dataset')
-            }
-
-            assert snapshot(
-                    process.out.batch_summary[0][1],
-                    process.out.full_table[0][1],
-                    process.out.missing_busco_list[0][1],
-                    process.out.versions[0]
-                ).match()
-
-            with(file(process.out.seq_dir[0][1]).listFiles().collect { it.name }) {
-                assert contains('single_copy_busco_sequences.tar.gz')
-                assert contains('multi_copy_busco_sequences.tar.gz')
-                assert contains('fragmented_busco_sequences.tar.gz')
-            }
-
-            with(path("${process.out.busco_dir[0][1]}/logs/busco.log").text) {
-                assert contains('DEBUG:busco.run_BUSCO')
-                assert contains('Results from dataset')
-                assert contains('how to cite BUSCO')
-            }
-
-            assert process.out.single_copy_proteins == []
-            assert process.out.translated_dir == []
-        }
-
-    }
-
-    test("test_busco_transcriptome") {
-
-        config './nextflow.config'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    file( params.test_data['bacteroides_fragilis']['illumina']['test1_contigs_fa_gz'], checkIfExists: true)
-                ]
-                input[1] = 'transcriptome'
-                input[2] = 'bacteria_odb10'
-                input[3] = []
-                input[4] = []
-                """
-            }
-        }
-
-        then {
-            assert process.success
-
-            with(path(process.out.short_summaries_txt[0][1]).text) {
-                assert contains('BUSCO version')
-                assert contains('The lineage dataset is')
-                assert contains('BUSCO was run in mode')
-                assert contains('Complete BUSCOs')
-                assert contains('Missing BUSCOs')
-                assert contains('Dependencies and versions')
-            }
-
-            with(path(process.out.short_summaries_json[0][1]).text) {
-                assert contains('one_line_summary')
-                assert contains('mode')
-                assert contains('dataset')
-            }
-
-            assert snapshot(
-                    process.out.batch_summary[0][1],
-                    process.out.full_table[0][1],
-                    process.out.missing_busco_list[0][1],
-                    process.out.translated_dir[0][1],
-                    process.out.single_copy_proteins[0][1],
-                    process.out.versions[0]
-                ).match()
-
-            with(file(process.out.seq_dir[0][1]).listFiles().collect { it.name }) {
-                assert contains('single_copy_busco_sequences.tar.gz')
-                assert contains('multi_copy_busco_sequences.tar.gz')
-                assert contains('fragmented_busco_sequences.tar.gz')
-            }
-
-            with(path("${process.out.busco_dir[0][1]}/logs/busco.log").text) {
-                assert contains('DEBUG:busco.run_BUSCO')
-                assert contains('Results from dataset')
-                assert contains('how to cite BUSCO')
-            }
-        }
-
-    }
-
-    test("minimal-stub") {
-
-        options '-stub'
-
-        when {
-            process {
-                """
-                input[0] = [
-                    [ id:'test' ], // meta map
-                    file( params.test_data['bacteroides_fragilis']['genome']['genome_fna_gz'], checkIfExists: true)
-                ]
-                input[1] = 'genome'
-                input[2] = 'bacteria_odb10'
-                input[3] = []
-                input[4] = []
-                """
-            }
-        }
-
-        then {
-            assertAll(
-                { assert process.success },
-                { assert snapshot(process.out).match() }
-            )
-        }
-    }
-
-}
diff --git a/modules/nf-core/busco/busco/tests/main.nf.test.snap b/modules/nf-core/busco/busco/tests/main.nf.test.snap
deleted file mode 100644
index 1b6411b..0000000
--- a/modules/nf-core/busco/busco/tests/main.nf.test.snap
+++ /dev/null
@@ -1,230 +0,0 @@
-{
-    "minimal-stub": {
-        "content": [
-            {
-                "0": [
-                    [
-                        {
-                            "id": "test"
-                        },
-                        "test-bacteria_odb10-busco.batch_summary.txt:md5,d41d8cd98f00b204e9800998ecf8427e"
-                    ]
-                ],
-                "1": [
-                    
-                ],
-                "2": [
-                    
-                ],
-                "3": [
-                    
-                ],
-                "4": [
-                    
-                ],
-                "5": [
-                    
-                ],
-                "6": [
-                    [
-                        {
-                            "id": "test"
-                        },
-                        [
-                            
-                        ]
-                    ]
-                ],
-                "7": [
-                    
-                ],
-                "8": [
-                    [
-                        {
-                            "id": "test"
-                        },
-                        [
-                            [
-                                [
-                                    [
-                                        
-                                    ]
-                                ]
-                            ]
-                        ]
-                    ]
-                ],
-                "9": [
-                    "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-                ],
-                "batch_summary": [
-                    [
-                        {
-                            "id": "test"
-                        },
-                        "test-bacteria_odb10-busco.batch_summary.txt:md5,d41d8cd98f00b204e9800998ecf8427e"
-                    ]
-                ],
-                "busco_dir": [
-                    [
-                        {
-                            "id": "test"
-                        },
-                        [
-                            [
-                                [
-                                    [
-                                        
-                                    ]
-                                ]
-                            ]
-                        ]
-                    ]
-                ],
-                "full_table": [
-                    
-                ],
-                "missing_busco_list": [
-                    
-                ],
-                "seq_dir": [
-                    [
-                        {
-                            "id": "test"
-                        },
-                        [
-                            
-                        ]
-                    ]
-                ],
-                "short_summaries_json": [
-                    
-                ],
-                "short_summaries_txt": [
-                    
-                ],
-                "single_copy_proteins": [
-                    
-                ],
-                "translated_dir": [
-                    
-                ],
-                "versions": [
-                    "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-                ]
-            }
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:28:04.451297"
-    },
-    "test_busco_eukaryote_augustus": {
-        "content": [
-            "test-eukaryota_odb10-busco.batch_summary.txt:md5,3ea3bdc423a461dae514d816bdc61c89",
-            "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:26:36.974986"
-    },
-    "test_busco_genome_single_fasta": {
-        "content": [
-            "test-bacteria_odb10-busco.batch_summary.txt:md5,21b3fb771cf36be917cc451540d999be",
-            "full_table.tsv:md5,638fe7590f442c57361554dae330eca1",
-            "missing_busco_list.tsv:md5,1530af4fe7673a6d001349537bcd410a",
-            "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:22:45.07816"
-    },
-    "test_busco_genome_multi_fasta": {
-        "content": [
-            "test-bacteria_odb10-busco.batch_summary.txt:md5,fcd3c208913e8abda3d6742c43fec5fa",
-            [
-                "full_table.tsv:md5,c657edcc7d0de0175869717551df6e83",
-                "full_table.tsv:md5,638fe7590f442c57361554dae330eca1"
-            ],
-            [
-                "missing_busco_list.tsv:md5,aceb66e347a353cb7fca8e2a725f9112",
-                "missing_busco_list.tsv:md5,1530af4fe7673a6d001349537bcd410a"
-            ],
-            "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:23:50.255602"
-    },
-    "test_busco_eukaryote_metaeuk": {
-        "content": [
-            "test-eukaryota_odb10-busco.batch_summary.txt:md5,ff6d8277e452a83ce9456bbee666feb6",
-            "full_table.tsv:md5,92b1b1d5cb5ea0e2093d16f00187e8c7",
-            "missing_busco_list.tsv:md5,0352e563de290bf804c708323c35a9e3",
-            "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:25:38.159041"
-    },
-    "test_busco_transcriptome": {
-        "content": [
-            "test-bacteria_odb10-busco.batch_summary.txt:md5,8734b3f379c4c0928e5dd4ea1873dc64",
-            "full_table.tsv:md5,1b2ce808fdafa744c56b5f781551272d",
-            "missing_busco_list.tsv:md5,a6931b6470262b997b8b99ea0f1d14a4",
-            [
-                "1024388at2.faa:md5,797d603d262a6595a112e25b73e878b0",
-                "1054741at2.faa:md5,cd4b928cba6b19b4437746ba507e7195",
-                "1093223at2.faa:md5,df9549708e5ffcfaee6a74dd70a0e5dc",
-                "1151822at2.faa:md5,12726afc1cdc40c13392e1596e93df3a",
-                "143460at2.faa:md5,d887431fd988a5556a523440f02d9594",
-                "1491686at2.faa:md5,d03362d19979b27306c192f1c74a84e5",
-                "1504821at2.faa:md5,4f5f6e5c57bac0092c1d85ded73d7e67",
-                "1574817at2.faa:md5,1153e55998c2929eacad2aed7d08d248",
-                "1592033at2.faa:md5,bb7a59e5f3a57ba12d10dabf4c77ab57",
-                "1623045at2.faa:md5,8fe38155feb1802beb97ef7714837bf5",
-                "1661836at2.faa:md5,6c6d592c2fbb0d7a4e5e1f47a15644f0",
-                "1674344at2.faa:md5,bb41b44e53565a54cadf0b780532fe08",
-                "1698718at2.faa:md5,f233860000028eb00329aa85236c71e5",
-                "1990650at2.faa:md5,34a2d29c5f8b6253159ddb7a43fa1829",
-                "223233at2.faa:md5,dec6705c7846c989296e73942f953cbc",
-                "402899at2.faa:md5,acc0f271f9a586d2ce1ee41669b22999",
-                "505485at2.faa:md5,aa0391f8fa5d9bd19b30d844d5a99845",
-                "665824at2.faa:md5,47f8ad43b6a6078206feb48c2e552793",
-                "776861at2.faa:md5,f8b90c13f7c6be828dea3bb920195e3d",
-                "874197at2.faa:md5,8d22a35a768debe6f376fc695d233a69",
-                "932854at2.faa:md5,2eff2de1ab83b22f3234a529a44e22bb",
-                "95696at2.faa:md5,247bfd1aef432f7b5456307768e9149c"
-            ],
-            "single_copy_proteins.faa:md5,73e2c5d6a9b0f01f2deea3cc5f21b764",
-            "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:27:53.992893"
-    },
-    "test_busco_protein": {
-        "content": [
-            "test-bacteria_odb10-busco.batch_summary.txt:md5,f5a782378f9f94a748aa907381fdef91",
-            "full_table.tsv:md5,812ab6a0496fccab774643cf40c4f2a8",
-            "missing_busco_list.tsv:md5,aceb66e347a353cb7fca8e2a725f9112",
-            "versions.yml:md5,3fc94714b95c2dc15399a4229d9dd1d9"
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-05-03T13:27:12.724862"
-    }
-}
\ No newline at end of file
diff --git a/modules/nf-core/busco/busco/tests/nextflow.augustus.config b/modules/nf-core/busco/busco/tests/nextflow.augustus.config
deleted file mode 100644
index 84daa69..0000000
--- a/modules/nf-core/busco/busco/tests/nextflow.augustus.config
+++ /dev/null
@@ -1,5 +0,0 @@
-process {
-    withName: 'BUSCO_BUSCO' {
-        ext.args = '--tar --augustus'
-    }
-}
diff --git a/modules/nf-core/busco/busco/tests/nextflow.config b/modules/nf-core/busco/busco/tests/nextflow.config
deleted file mode 100644
index 1ec3fec..0000000
--- a/modules/nf-core/busco/busco/tests/nextflow.config
+++ /dev/null
@@ -1,5 +0,0 @@
-process {
-    withName: 'BUSCO_BUSCO' {
-        ext.args = '--tar'
-    }
-}
diff --git a/modules/nf-core/busco/busco/tests/nextflow.metaeuk.config b/modules/nf-core/busco/busco/tests/nextflow.metaeuk.config
deleted file mode 100644
index c141844..0000000
--- a/modules/nf-core/busco/busco/tests/nextflow.metaeuk.config
+++ /dev/null
@@ -1,5 +0,0 @@
-process {
-    withName: 'BUSCO_BUSCO' {
-        ext.args = '--tar --metaeuk'
-    }
-}
diff --git a/modules/nf-core/busco/busco/tests/old_test.yml b/modules/nf-core/busco/busco/tests/old_test.yml
deleted file mode 100644
index 75177f5..0000000
--- a/modules/nf-core/busco/busco/tests/old_test.yml
+++ /dev/null
@@ -1,624 +0,0 @@
-- name: busco test_busco_genome_single_fasta
-  command: nextflow run ./tests/modules/nf-core/busco -entry test_busco_genome_single_fasta -c ./tests/config/nextflow.config
-  tags:
-    - busco
-  files:
-    - path: output/busco/short_summary.specific.bacteria_odb10.genome.fna.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.bacteria_odb10.genome.fna.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/test-bacteria_odb10-busco.batch_summary.txt
-      md5sum: bc2440f8a68d7fbf931ff911c1c3fdfa
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/bbtools_err.log
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/bbtools_out.log
-      md5sum: 9caf1a1434414c78562eb0bbb9c0e53f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/hmmsearch_err.log
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/hmmsearch_out.log
-      contains:
-        - "# hmmsearch :: search profile(s) against a sequence database"
-        - "# target sequence database:"
-        - "Internal pipeline statistics summary:"
-        - "[ok]"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/prodigal_err.log
-      md5sum: 538510cfc7483498210f01e53fe035ad
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/prodigal_out.log
-      md5sum: 61050b0706addc9498b2088a2d6efa9a
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/.checkpoint
-      contains:
-        - "Tool: prodigal"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/predicted.faa
-      md5sum: 836e9a80d33d8b89168f07ddc13ee991
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/predicted.fna
-      md5sum: 20eeb75f86842e6e136f02bca8b73a9f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11.faa
-      md5sum: 836e9a80d33d8b89168f07ddc13ee991
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11.fna
-      md5sum: 20eeb75f86842e6e136f02bca8b73a9f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11_err.log
-      md5sum: 538510cfc7483498210f01e53fe035ad
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11_out.log
-      md5sum: 61050b0706addc9498b2088a2d6efa9a
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/.bbtools_output/.checkpoint
-      contains:
-        - "Tool: bbtools"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/full_table.tsv
-      md5sum: c56edab1dc1522e993c25ae2b730799f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/missing_busco_list.tsv
-      md5sum: b533ef30270f27160acce85a22d01bf5
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "lineage_dataset"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/test-bacteria_odb10-busco/logs/busco.log
-      contains:
-        - "DEBUG:busco.run_BUSCO"
-        - "Results from dataset"
-        - "how to cite BUSCO"
-    - path: output/busco/versions.yml
-
-- name: busco test_busco_genome_multi_fasta
-  command: nextflow run ./tests/modules/nf-core/busco -entry test_busco_genome_multi_fasta -c ./tests/config/nextflow.config
-  tags:
-    - busco
-  files:
-    - path: output/busco/short_summary.specific.bacteria_odb10.genome.fasta.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.bacteria_odb10.genome.fasta.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/short_summary.specific.bacteria_odb10.genome.fna.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.bacteria_odb10.genome.fna.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/test-bacteria_odb10-busco.batch_summary.txt
-      md5sum: 8c64c1a28b086ef2ee444f99cbed5f7d
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/logs/bbtools_err.log
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/logs/bbtools_out.log
-      md5sum: 8f047bdb33264d22a83920bc2c63f29a
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/logs/hmmsearch_err.log
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/logs/hmmsearch_out.log
-      contains:
-        - "# hmmsearch :: search profile(s) against a sequence database"
-        - "# target sequence database:"
-        - "Internal pipeline statistics summary:"
-        - "[ok]"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/logs/prodigal_err.log
-      md5sum: c1fdc6977332f53dfe7f632733bb4585
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/logs/prodigal_out.log
-      md5sum: 50752acb1c5a20be886bfdfc06635bcb
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/.checkpoint
-      contains:
-        - "Tool: prodigal"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/predicted.faa
-      md5sum: 8166471fc5f08c82fd5643ab42327f9d
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/predicted.fna
-      md5sum: ddc508a18f60e7f3314534df50cdf8ca
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11.faa
-      md5sum: 8166471fc5f08c82fd5643ab42327f9d
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11.fna
-      md5sum: ddc508a18f60e7f3314534df50cdf8ca
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11_err.log
-      md5sum: c1fdc6977332f53dfe7f632733bb4585
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11_out.log
-      md5sum: 50752acb1c5a20be886bfdfc06635bcb
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_4.faa
-      md5sum: e56fd59c38248dc21ac94355dca98121
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_4.fna
-      md5sum: b365f84bf99c68357952e0b98ed7ce42
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_4_err.log
-      md5sum: e5f14d7925ba14a0f9850542f3739894
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_4_out.log
-      md5sum: d41971bfc1b621d4ffd2633bc47017ea
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/.bbtools_output/.checkpoint
-      contains:
-        - "Tool: bbtools"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/full_table.tsv
-      md5sum: c9651b88b10871abc260ee655898e828
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/missing_busco_list.tsv
-      md5sum: 9939309df2da5419de88c32d1435c779
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fasta/run_bacteria_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/bbtools_err.log
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/bbtools_out.log
-      md5sum: 9caf1a1434414c78562eb0bbb9c0e53f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/hmmsearch_err.log
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/hmmsearch_out.log
-      contains:
-        - "# hmmsearch :: search profile(s) against a sequence database"
-        - "# target sequence database:"
-        - "Internal pipeline statistics summary:"
-        - "[ok]"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/prodigal_err.log
-      md5sum: 538510cfc7483498210f01e53fe035ad
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/logs/prodigal_out.log
-      md5sum: 61050b0706addc9498b2088a2d6efa9a
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/.checkpoint
-      contains:
-        - "Tool: prodigal"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/predicted.faa
-      md5sum: 836e9a80d33d8b89168f07ddc13ee991
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/predicted.fna
-      md5sum: 20eeb75f86842e6e136f02bca8b73a9f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11.faa
-      md5sum: 836e9a80d33d8b89168f07ddc13ee991
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11.fna
-      md5sum: 20eeb75f86842e6e136f02bca8b73a9f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11_err.log
-      md5sum: 538510cfc7483498210f01e53fe035ad
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/prodigal_output/predicted_genes/tmp/prodigal_mode_single_code_11_out.log
-      md5sum: 61050b0706addc9498b2088a2d6efa9a
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/.bbtools_output/.checkpoint
-      contains:
-        - "Tool: bbtools"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/full_table.tsv
-      md5sum: c56edab1dc1522e993c25ae2b730799f
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/missing_busco_list.tsv
-      md5sum: b533ef30270f27160acce85a22d01bf5
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/test-bacteria_odb10-busco/genome.fna/run_bacteria_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/test-bacteria_odb10-busco/logs/busco.log
-      contains:
-        - "DEBUG:busco.run_BUSCO"
-        - "Results from dataset"
-        - "how to cite BUSCO"
-    - path: output/busco/versions.yml
-
-- name: busco test_busco_eukaryote_metaeuk
-  command: nextflow run ./tests/modules/nf-core/busco -entry test_busco_eukaryote_metaeuk -c ./tests/config/nextflow.config
-  tags:
-    - busco
-  files:
-    - path: output/busco/short_summary.specific.eukaryota_odb10.genome.fasta.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.eukaryota_odb10.genome.fasta.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/test-eukaryota_odb10-busco.batch_summary.txt
-      md5sum: ff6d8277e452a83ce9456bbee666feb6
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/bbtools_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/bbtools_out.log
-      md5sum: e63debaa653f18f7405d936050abc093
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/hmmsearch_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/hmmsearch_out.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run1_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run1_out.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run2_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run2_out.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/.bbtools_output/.checkpoint
-      contains:
-        - "Tool: bbtools"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/full_table.tsv
-      md5sum: bd880e90b9e5620a58943a3e0f9ff16b
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/.checkpoint
-      contains:
-        - "Tool: metaeuk"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/combined_pred_proteins.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.codon.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.gff
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.headersMap.tsv
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/refseq_db_rerun.faa
-      md5sum: d80b8fa4cb5ed0d47d63d6aa93635bc2
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.codon.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.gff
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.headersMap.tsv
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/missing_busco_list.tsv
-      md5sum: 1e8e79c540fd2e69ba0d2659d9eb2988
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/test-eukaryota_odb10-busco/logs/busco.log
-      contains:
-        - "DEBUG:busco.run_BUSCO"
-        - "Results from dataset"
-        - "how to cite BUSCO"
-    - path: output/busco/versions.yml
-
-- name: busco test_busco_eukaryote_augustus
-  command: nextflow run ./tests/modules/nf-core/busco -entry test_busco_eukaryote_augustus -c ./tests/config/nextflow.config
-  tags:
-    - busco
-  files:
-    - path: output/busco/short_summary.specific.eukaryota_odb10.genome.fasta.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.eukaryota_odb10.genome.fasta.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/test-eukaryota_odb10-busco.batch_summary.txt
-      md5sum: ff6d8277e452a83ce9456bbee666feb6
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/bbtools_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/bbtools_out.log
-      md5sum: e63debaa653f18f7405d936050abc093
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/hmmsearch_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/hmmsearch_out.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run1_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run1_out.log
-      contains:
-        - "metaeuk"
-        - "easy-predict"
-        - "Compute score and coverage"
-        - "Time for processing:"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run2_err.log
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/logs/metaeuk_run2_out.log
-      contains:
-        - "metaeuk"
-        - "easy-predict"
-        - "Compute score and coverage"
-        - "Time for processing:"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/.bbtools_output/.checkpoint
-      contains:
-        - "Tool: bbtools"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/full_table.tsv
-      md5sum: bd880e90b9e5620a58943a3e0f9ff16b
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/.checkpoint
-      contains:
-        - "Tool: metaeuk"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/combined_pred_proteins.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.codon.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.gff
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/initial_results/genome.fasta.headersMap.tsv
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/refseq_db_rerun.faa
-      md5sum: d80b8fa4cb5ed0d47d63d6aa93635bc2
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.codon.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.fas
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.gff
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/metaeuk_output/rerun_results/genome.fasta.headersMap.tsv
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/missing_busco_list.tsv
-      md5sum: 1e8e79c540fd2e69ba0d2659d9eb2988
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/test-eukaryota_odb10-busco/genome.fasta/run_eukaryota_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/test-eukaryota_odb10-busco/logs/busco.log
-      contains:
-        - "DEBUG:busco.run_BUSCO"
-        - "Results from dataset"
-        - "how to cite BUSCO"
-    - path: output/busco/versions.yml
-
-- name: busco test_busco_protein
-  command: nextflow run ./tests/modules/nf-core/busco -entry test_busco_protein -c ./tests/config/nextflow.config
-  tags:
-    - busco
-  files:
-    - path: output/busco/short_summary.specific.bacteria_odb10.proteome.fasta.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.bacteria_odb10.proteome.fasta.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/test-bacteria_odb10-busco.batch_summary.txt
-      md5sum: 7a65e6cbb6c56a2ea4e739ae0aa3297d
-    - path: output/busco/test-bacteria_odb10-busco/logs/busco.log
-      contains:
-        - "DEBUG:busco.run_BUSCO"
-        - "Results from dataset"
-        - "how to cite BUSCO"
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/logs/hmmsearch_err.log
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/logs/hmmsearch_out.log
-      contains:
-        - "# hmmsearch :: search profile(s) against a sequence database"
-        - "# target sequence database:"
-        - "Internal pipeline statistics summary:"
-        - "[ok]"
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/full_table.tsv
-      md5sum: 0e34f1011cd83ea1d5d5103ec62b8922
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/missing_busco_list.tsv
-      md5sum: 9939309df2da5419de88c32d1435c779
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/test-bacteria_odb10-busco/proteome.fasta/run_bacteria_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/versions.yml
-
-- name: busco test_busco_transcriptome
-  command: nextflow run ./tests/modules/nf-core/busco -entry test_busco_transcriptome -c ./tests/config/nextflow.config
-  tags:
-    - busco
-  files:
-    - path: output/busco/short_summary.specific.bacteria_odb10.test1.contigs.fa.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/short_summary.specific.bacteria_odb10.test1.contigs.fa.txt
-      contains:
-        - "BUSCO version"
-        - "The lineage dataset is"
-        - "BUSCO was run in mode"
-        - "Complete BUSCOs"
-        - "Missing BUSCOs"
-        - "Dependencies and versions"
-    - path: output/busco/test-bacteria_odb10-busco.batch_summary.txt
-      md5sum: 46118ecf60d1b87d22b96d80f4f03632
-    - path: output/busco/test-bacteria_odb10-busco/logs/busco.log
-      contains:
-        - "DEBUG:busco.run_BUSCO"
-        - "Results from dataset"
-        - "how to cite BUSCO"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/.checkpoint
-      contains:
-        - "Tool: makeblastdb"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.ndb
-      md5sum: 3788c017fe5e6f0f58224e9cdd21822b
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.nhr
-      md5sum: 8ecd2ce392bb5e25ddbe1d85f879582e
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.nin
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.njs
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.not
-      md5sum: 0c340e376c7e85d19f82ec1a833e6a6e
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.nsq
-      md5sum: 532d5c0a7ea00fe95ca3c97cb3be6198
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.ntf
-      md5sum: de1250813f0c7affc6d12dac9d0fb6bb
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/blast_db/test1.contigs.fa.nto
-      md5sum: ff74bd41f9cc9b011c63a32c4f7693bf
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/logs/hmmsearch_err.log
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/logs/hmmsearch_out.log
-      contains:
-        - "# hmmsearch :: search profile(s) against a sequence database"
-        - "# target sequence database:"
-        - "Internal pipeline statistics summary:"
-        - "[ok]"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/logs/makeblastdb_err.log
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/logs/makeblastdb_out.log
-      contains:
-        - "Building a new DB"
-        - "Adding sequences from FASTA"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/logs/tblastn_err.log
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/logs/tblastn_out.log
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/.checkpoint
-      contains:
-        - "Tool: tblastn"
-        - "Completed"
-        - "jobs"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/coordinates.tsv
-      md5sum: cc30eed321944af293452bdbcfc24292
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_101.temp
-      md5sum: 73e9c65fc83fedc58f57f09b08f08238
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_119.temp
-      md5sum: 7fa4cc7955ec0cc36330a221c579b975
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_129.temp
-      md5sum: 6f1601c875d019e3f6f1f98ed8e988d4
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_138.temp
-      md5sum: 3f8e034686cd240c2330650d791bcae2
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_143.temp
-      md5sum: df3dfa8e9ba30ed70cf75b5e7abf2179
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_172.temp
-      md5sum: 7d463e0e6cf7169bc9077d8dc776dda1
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_178.temp
-      md5sum: 2288edf7fa4f88f51b4cf4d94086f77e
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_188.temp
-      md5sum: 029906abbad6d87fc57830dd548cac24
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_195.temp
-      md5sum: 4937f3b348774a31b1160a00297c29cc
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_210.temp
-      md5sum: afcb20ba4c466479d6b91c8c62251e1f
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_232.temp
-      md5sum: 2e1e823ce017345bd998191a39fa9924
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_268.temp
-      md5sum: 08c2d82c34ecffbe1c638b410349412e
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_29.temp
-      md5sum: cd9b63cf93524284781535c888313764
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_44.temp
-      md5sum: d1929b742b24ebe379bf4801ca882dca
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_58.temp
-      md5sum: 69215765b010c05336538cb322c900b3
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_72.temp
-      md5sum: 6feaa1cc3b0899a147ea9d466878f3e3
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_80.temp
-      md5sum: 13625eae14e860a96ce17cd4e37e9d01
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_81.temp
-      md5sum: e14b2484649b0dbc8926815c207b806d
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_93.temp
-      md5sum: 6902c93691df00e690faea914c71839e
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/sequences/k141_97.temp
-      md5sum: 0a0d9d38a83acbd5ad43c29cdf429988
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/blast_output/tblastn.tsv
-      contains:
-        - "TBLASTN"
-        - "BLAST processed"
-        - "queries"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/busco_sequences/fragmented_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/busco_sequences/multi_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/busco_sequences/single_copy_busco_sequences.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/full_table.tsv
-      md5sum: 24df25199e13c88bd892fc3e7b541ca0
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/hmmer_output.tar.gz
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/missing_busco_list.tsv
-      md5sum: e7232e2b8cca4fdfdd9e363b39ebbc81
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/short_summary.json
-      contains:
-        - "one_line_summary"
-        - "mode"
-        - "dataset"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/short_summary.txt
-      contains:
-        - "# BUSCO version is:"
-        - "Results:"
-        - "busco:"
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/run_bacteria_odb10/single_copy_proteins.faa
-      md5sum: e04b9465733577ae6e4bccb7aa01e720
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1024388at2.faa
-      md5sum: 7333c39a20258f20c7019ea0cd83157c
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1054741at2.faa
-      md5sum: ebb481e77a824685fbe04d8a2f3a0d7d
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1093223at2.faa
-      md5sum: 34621c7d499034e8f8e6b92fd4020a93
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1151822at2.faa
-      md5sum: aa89ca381c1c70c9c4e1380351ca7c2a
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/143460at2.faa
-      md5sum: f2e91d78b8dd3722840378789f29e8c8
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1491686at2.faa
-      md5sum: 73c25aef5c9cba7f4151804941b146ea
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1504821at2.faa
-      md5sum: cda556018d1f84ebe517e89f6fc107d0
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1574817at2.faa
-      md5sum: a9096c9fb8b25c78a72871ab0463acdc
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1592033at2.faa
-      md5sum: e463d25ce186c0cebfd749474f3a4c64
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1623045at2.faa
-      md5sum: f2cfd241590c6d8377286d6135480937
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1661836at2.faa
-      md5sum: 586569546fb9861502468e3d9ba2775c
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1674344at2.faa
-      md5sum: 24c658bee14ad84b062d81ad96642eb8
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1698718at2.faa
-      md5sum: 0b8e26ddf5149bbd8805be7af125208d
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/1990650at2.faa
-      md5sum: 159320712ee01fb2ccb31a25df44eead
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/223233at2.faa
-      md5sum: 812629c0b06ac3d18661c2ca78de0c08
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/402899at2.faa
-      md5sum: f7ff4e1591342d30b77392a2e84b57d9
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/505485at2.faa
-      md5sum: 7b34a24fc49c540d46fcf96ff5129564
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/665824at2.faa
-      md5sum: 4cff2df64f6bcaff8bc19c234c8bcccd
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/776861at2.faa
-      md5sum: 613af7a3fea30ea2bece66f603b9284a
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/874197at2.faa
-      md5sum: a7cd1b13c9ef91c7ef4e31614166f197
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/932854at2.faa
-      md5sum: fe313ffd5efdb0fed887a04fba352552
-    - path: output/busco/test-bacteria_odb10-busco/test1.contigs.fa/translated_proteins/95696at2.faa
-      md5sum: 4e1f30a2fea4dfbf9bb7fae2700622a0
-    - path: output/busco/versions.yml
diff --git a/modules/nf-core/busco/busco/tests/tags.yml b/modules/nf-core/busco/busco/tests/tags.yml
deleted file mode 100644
index 7c4d283..0000000
--- a/modules/nf-core/busco/busco/tests/tags.yml
+++ /dev/null
@@ -1,2 +0,0 @@
-busco/busco:
-  - "modules/nf-core/busco/busco/**"
diff --git a/modules/nf-core/fastqc/environment.yml b/modules/nf-core/fastqc/environment.yml
deleted file mode 100644
index 1787b38..0000000
--- a/modules/nf-core/fastqc/environment.yml
+++ /dev/null
@@ -1,7 +0,0 @@
-name: fastqc
-channels:
-  - conda-forge
-  - bioconda
-  - defaults
-dependencies:
-  - bioconda::fastqc=0.12.1
diff --git a/modules/nf-core/fastqc/main.nf b/modules/nf-core/fastqc/main.nf
deleted file mode 100644
index d79f1c8..0000000
--- a/modules/nf-core/fastqc/main.nf
+++ /dev/null
@@ -1,61 +0,0 @@
-process FASTQC {
-    tag "$meta.id"
-    label 'process_medium'
-
-    conda "${moduleDir}/environment.yml"
-    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
-        'https://depot.galaxyproject.org/singularity/fastqc:0.12.1--hdfd78af_0' :
-        'biocontainers/fastqc:0.12.1--hdfd78af_0' }"
-
-    input:
-    tuple val(meta), path(reads)
-
-    output:
-    tuple val(meta), path("*.html"), emit: html
-    tuple val(meta), path("*.zip") , emit: zip
-    path  "versions.yml"           , emit: versions
-
-    when:
-    task.ext.when == null || task.ext.when
-
-    script:
-    def args = task.ext.args ?: ''
-    def prefix = task.ext.prefix ?: "${meta.id}"
-    // Make list of old name and new name pairs to use for renaming in the bash while loop
-    def old_new_pairs = reads instanceof Path || reads.size() == 1 ? [[ reads, "${prefix}.${reads.extension}" ]] : reads.withIndex().collect { entry, index -> [ entry, "${prefix}_${index + 1}.${entry.extension}" ] }
-    def rename_to = old_new_pairs*.join(' ').join(' ')
-    def renamed_files = old_new_pairs.collect{ old_name, new_name -> new_name }.join(' ')
-
-    def memory_in_mb = MemoryUnit.of("${task.memory}").toUnit('MB')
-    // FastQC memory value allowed range (100 - 10000)
-    def fastqc_memory = memory_in_mb > 10000 ? 10000 : (memory_in_mb < 100 ? 100 : memory_in_mb)
-
-    """
-    printf "%s %s\\n" $rename_to | while read old_name new_name; do
-        [ -f "\${new_name}" ] || ln -s \$old_name \$new_name
-    done
-
-    fastqc \\
-        $args \\
-        --threads $task.cpus \\
-        --memory $fastqc_memory \\
-        $renamed_files
-
-    cat <<-END_VERSIONS > versions.yml
-    "${task.process}":
-        fastqc: \$( fastqc --version | sed '/FastQC v/!d; s/.*v//' )
-    END_VERSIONS
-    """
-
-    stub:
-    def prefix = task.ext.prefix ?: "${meta.id}"
-    """
-    touch ${prefix}.html
-    touch ${prefix}.zip
-
-    cat <<-END_VERSIONS > versions.yml
-    "${task.process}":
-        fastqc: \$( fastqc --version | sed '/FastQC v/!d; s/.*v//' )
-    END_VERSIONS
-    """
-}
diff --git a/modules/nf-core/fastqc/meta.yml b/modules/nf-core/fastqc/meta.yml
deleted file mode 100644
index ee5507e..0000000
--- a/modules/nf-core/fastqc/meta.yml
+++ /dev/null
@@ -1,57 +0,0 @@
-name: fastqc
-description: Run FastQC on sequenced reads
-keywords:
-  - quality control
-  - qc
-  - adapters
-  - fastq
-tools:
-  - fastqc:
-      description: |
-        FastQC gives general quality metrics about your reads.
-        It provides information about the quality score distribution
-        across your reads, the per base sequence content (%A/C/G/T).
-        You get information about adapter contamination and other
-        overrepresented sequences.
-      homepage: https://www.bioinformatics.babraham.ac.uk/projects/fastqc/
-      documentation: https://www.bioinformatics.babraham.ac.uk/projects/fastqc/Help/
-      licence: ["GPL-2.0-only"]
-input:
-  - meta:
-      type: map
-      description: |
-        Groovy Map containing sample information
-        e.g. [ id:'test', single_end:false ]
-  - reads:
-      type: file
-      description: |
-        List of input FastQ files of size 1 and 2 for single-end and paired-end data,
-        respectively.
-output:
-  - meta:
-      type: map
-      description: |
-        Groovy Map containing sample information
-        e.g. [ id:'test', single_end:false ]
-  - html:
-      type: file
-      description: FastQC report
-      pattern: "*_{fastqc.html}"
-  - zip:
-      type: file
-      description: FastQC report archive
-      pattern: "*_{fastqc.zip}"
-  - versions:
-      type: file
-      description: File containing software versions
-      pattern: "versions.yml"
-authors:
-  - "@drpatelh"
-  - "@grst"
-  - "@ewels"
-  - "@FelixKrueger"
-maintainers:
-  - "@drpatelh"
-  - "@grst"
-  - "@ewels"
-  - "@FelixKrueger"
diff --git a/modules/nf-core/fastqc/tests/main.nf.test b/modules/nf-core/fastqc/tests/main.nf.test
deleted file mode 100644
index 70edae4..0000000
--- a/modules/nf-core/fastqc/tests/main.nf.test
+++ /dev/null
@@ -1,212 +0,0 @@
-nextflow_process {
-
-    name "Test Process FASTQC"
-    script "../main.nf"
-    process "FASTQC"
-
-    tag "modules"
-    tag "modules_nfcore"
-    tag "fastqc"
-
-    test("sarscov2 single-end [fastq]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [ id: 'test', single_end:true ],
-                    [ file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) ]
-                ])
-                """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-
-            // NOTE The report contains the date inside it, which means that the md5sum is stable per day, but not longer than that. So you can't md5sum it.
-            // looks like this: <div id="header_filename">Mon 2 Oct 2023<br/>test.gz</div>
-            // https://github.com/nf-core/modules/pull/3903#issuecomment-1743620039
-
-            { assert process.out.html[0][1] ==~ ".*/test_fastqc.html" },
-            { assert process.out.zip[0][1] ==~ ".*/test_fastqc.zip" },
-            { assert path(process.out.html[0][1]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-
-            { assert snapshot(process.out.versions).match("fastqc_versions_single") }
-            )
-        }
-    }
-
-    test("sarscov2 paired-end [fastq]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [id: 'test', single_end: false], // meta map
-                    [ file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true),
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_2.fastq.gz', checkIfExists: true) ]
-                ])
-                """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-
-            { assert process.out.html[0][1][0] ==~ ".*/test_1_fastqc.html" },
-            { assert process.out.html[0][1][1] ==~ ".*/test_2_fastqc.html" },
-            { assert process.out.zip[0][1][0] ==~ ".*/test_1_fastqc.zip" },
-            { assert process.out.zip[0][1][1] ==~ ".*/test_2_fastqc.zip" },
-            { assert path(process.out.html[0][1][0]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-            { assert path(process.out.html[0][1][1]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-
-            { assert snapshot(process.out.versions).match("fastqc_versions_paired") }
-            )
-        }
-    }
-
-    test("sarscov2 interleaved [fastq]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [id: 'test', single_end: false], // meta map
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_interleaved.fastq.gz', checkIfExists: true)
-                ])
-            """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-
-            { assert process.out.html[0][1] ==~ ".*/test_fastqc.html" },
-            { assert process.out.zip[0][1] ==~ ".*/test_fastqc.zip" },
-            { assert path(process.out.html[0][1]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-
-            { assert snapshot(process.out.versions).match("fastqc_versions_interleaved") }
-            )
-        }
-    }
-
-    test("sarscov2 paired-end [bam]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [id: 'test', single_end: false], // meta map
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/bam/test.paired_end.sorted.bam', checkIfExists: true)
-                ])
-                """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-
-            { assert process.out.html[0][1] ==~ ".*/test_fastqc.html" },
-            { assert process.out.zip[0][1] ==~ ".*/test_fastqc.zip" },
-            { assert path(process.out.html[0][1]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-
-            { assert snapshot(process.out.versions).match("fastqc_versions_bam") }
-            )
-        }
-    }
-
-    test("sarscov2 multiple [fastq]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [id: 'test', single_end: false], // meta map
-                    [ file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true),
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_2.fastq.gz', checkIfExists: true),
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test2_1.fastq.gz', checkIfExists: true),
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test2_2.fastq.gz', checkIfExists: true) ]
-                ])
-                """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-
-            { assert process.out.html[0][1][0] ==~ ".*/test_1_fastqc.html" },
-            { assert process.out.html[0][1][1] ==~ ".*/test_2_fastqc.html" },
-            { assert process.out.html[0][1][2] ==~ ".*/test_3_fastqc.html" },
-            { assert process.out.html[0][1][3] ==~ ".*/test_4_fastqc.html" },
-            { assert process.out.zip[0][1][0] ==~ ".*/test_1_fastqc.zip" },
-            { assert process.out.zip[0][1][1] ==~ ".*/test_2_fastqc.zip" },
-            { assert process.out.zip[0][1][2] ==~ ".*/test_3_fastqc.zip" },
-            { assert process.out.zip[0][1][3] ==~ ".*/test_4_fastqc.zip" },
-            { assert path(process.out.html[0][1][0]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-            { assert path(process.out.html[0][1][1]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-            { assert path(process.out.html[0][1][2]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-            { assert path(process.out.html[0][1][3]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-
-            { assert snapshot(process.out.versions).match("fastqc_versions_multiple") }
-            )
-        }
-    }
-
-    test("sarscov2 custom_prefix") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [ id:'mysample', single_end:true ], // meta map
-                    file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true)
-                ])
-                """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-
-            { assert process.out.html[0][1] ==~ ".*/mysample_fastqc.html" },
-            { assert process.out.zip[0][1] ==~ ".*/mysample_fastqc.zip" },
-            { assert path(process.out.html[0][1]).text.contains("<tr><td>File type</td><td>Conventional base calls</td></tr>") },
-
-            { assert snapshot(process.out.versions).match("fastqc_versions_custom_prefix") }
-            )
-        }
-    }
-
-    test("sarscov2 single-end [fastq] - stub") {
-
-        options "-stub"
-
-        when {
-            process {
-                """
-                input[0] = Channel.of([
-                    [ id: 'test', single_end:true ],
-                    [ file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastq/test_1.fastq.gz', checkIfExists: true) ]
-                ])
-                """
-            }
-        }
-
-        then {
-            assertAll (
-            { assert process.success },
-            { assert snapshot(process.out.html.collect { file(it[1]).getName() } +
-                                process.out.zip.collect { file(it[1]).getName() } +
-                                process.out.versions ).match("fastqc_stub") }
-            )
-        }
-    }
-
-}
diff --git a/modules/nf-core/fastqc/tests/main.nf.test.snap b/modules/nf-core/fastqc/tests/main.nf.test.snap
deleted file mode 100644
index 86f7c31..0000000
--- a/modules/nf-core/fastqc/tests/main.nf.test.snap
+++ /dev/null
@@ -1,88 +0,0 @@
-{
-    "fastqc_versions_interleaved": {
-        "content": [
-            [
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:40:07.293713"
-    },
-    "fastqc_stub": {
-        "content": [
-            [
-                "test.html",
-                "test.zip",
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:31:01.425198"
-    },
-    "fastqc_versions_multiple": {
-        "content": [
-            [
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:40:55.797907"
-    },
-    "fastqc_versions_bam": {
-        "content": [
-            [
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:40:26.795862"
-    },
-    "fastqc_versions_single": {
-        "content": [
-            [
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:39:27.043675"
-    },
-    "fastqc_versions_paired": {
-        "content": [
-            [
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:39:47.584191"
-    },
-    "fastqc_versions_custom_prefix": {
-        "content": [
-            [
-                "versions.yml:md5,e1cc25ca8af856014824abd842e93978"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-01-31T17:41:14.576531"
-    }
-}
\ No newline at end of file
diff --git a/modules/nf-core/fastqc/tests/tags.yml b/modules/nf-core/fastqc/tests/tags.yml
deleted file mode 100644
index 7834294..0000000
--- a/modules/nf-core/fastqc/tests/tags.yml
+++ /dev/null
@@ -1,2 +0,0 @@
-fastqc:
-  - modules/nf-core/fastqc/**
diff --git a/modules/nf-core/merquryfk/merquryfk/main.nf b/modules/nf-core/merquryfk/merquryfk/main.nf
index ac163da..f0e78cc 100644
--- a/modules/nf-core/merquryfk/merquryfk/main.nf
+++ b/modules/nf-core/merquryfk/merquryfk/main.nf
@@ -39,11 +39,16 @@ process MERQURYFK_MERQURYFK {
     prefix = task.ext.prefix ?: "${meta.id}"
     def FASTK_VERSION = 'f18a4e6d2207539f7b84461daebc54530a9559b0' // WARN: Version information not provided by tool on CLI. Please update this string when bumping container versions.
     def MERQURY_VERSION = '8ae344092df5dcaf83cfb7f90f662597a9b1fc61' // WARN: Version information not provided by tool on CLI. Please update this string when bumping container versions.
+
+    // Passing in the link through FASTK works, however passing in through YAML_INPUT results in being unable to find file
+    // seems as though it is because it is in a folder rather directly in the folder merqury is running in.
     """
+    cp ${fastk_ktab}/*ktab . && cp ${fastk_ktab}/.*ktab.* .
+
     MerquryFK \\
         $args \\
         -T$task.cpus \\
-        ${fastk_ktab.find{ it.toString().endsWith(".ktab") }} \\
+        *.ktab \\
         $assembly \\
         $haplotigs \\
         $prefix
diff --git a/modules/nf-core/merquryfk/merquryfk/merquryfk-merquryfk.diff b/modules/nf-core/merquryfk/merquryfk/merquryfk-merquryfk.diff
new file mode 100644
index 0000000..751b30b
--- /dev/null
+++ b/modules/nf-core/merquryfk/merquryfk/merquryfk-merquryfk.diff
@@ -0,0 +1,23 @@
+Changes in module 'nf-core/merquryfk/merquryfk'
+--- modules/nf-core/merquryfk/merquryfk/main.nf
++++ modules/nf-core/merquryfk/merquryfk/main.nf
+@@ -39,11 +39,16 @@
+     prefix = task.ext.prefix ?: "${meta.id}"
+     def FASTK_VERSION = 'f18a4e6d2207539f7b84461daebc54530a9559b0' // WARN: Version information not provided by tool on CLI. Please update this string when bumping container versions.
+     def MERQURY_VERSION = '8ae344092df5dcaf83cfb7f90f662597a9b1fc61' // WARN: Version information not provided by tool on CLI. Please update this string when bumping container versions.
++
++    // Passing in the link through FASTK works, however passing in through YAML_INPUT results in being unable to find file
++    // seems as though it is because it is in a folder rather directly in the folder merqury is running in.
+     """
++    cp ${fastk_ktab}/*ktab . && cp ${fastk_ktab}/.*ktab.* .
++
+     MerquryFK \\
+         $args \\
+         -T$task.cpus \\
+-        ${fastk_ktab.find{ it.toString().endsWith(".ktab") }} \\
++        *.ktab \\
+         $assembly \\
+         $haplotigs \\
+         $prefix
+
+************************************************************
diff --git a/modules/nf-core/multiqc/environment.yml b/modules/nf-core/multiqc/environment.yml
deleted file mode 100644
index ca39fb6..0000000
--- a/modules/nf-core/multiqc/environment.yml
+++ /dev/null
@@ -1,7 +0,0 @@
-name: multiqc
-channels:
-  - conda-forge
-  - bioconda
-  - defaults
-dependencies:
-  - bioconda::multiqc=1.21
diff --git a/modules/nf-core/multiqc/main.nf b/modules/nf-core/multiqc/main.nf
deleted file mode 100644
index 47ac352..0000000
--- a/modules/nf-core/multiqc/main.nf
+++ /dev/null
@@ -1,55 +0,0 @@
-process MULTIQC {
-    label 'process_single'
-
-    conda "${moduleDir}/environment.yml"
-    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
-        'https://depot.galaxyproject.org/singularity/multiqc:1.21--pyhdfd78af_0' :
-        'biocontainers/multiqc:1.21--pyhdfd78af_0' }"
-
-    input:
-    path  multiqc_files, stageAs: "?/*"
-    path(multiqc_config)
-    path(extra_multiqc_config)
-    path(multiqc_logo)
-
-    output:
-    path "*multiqc_report.html", emit: report
-    path "*_data"              , emit: data
-    path "*_plots"             , optional:true, emit: plots
-    path "versions.yml"        , emit: versions
-
-    when:
-    task.ext.when == null || task.ext.when
-
-    script:
-    def args = task.ext.args ?: ''
-    def config = multiqc_config ? "--config $multiqc_config" : ''
-    def extra_config = extra_multiqc_config ? "--config $extra_multiqc_config" : ''
-    def logo = multiqc_logo ? /--cl-config 'custom_logo: "${multiqc_logo}"'/ : ''
-    """
-    multiqc \\
-        --force \\
-        $args \\
-        $config \\
-        $extra_config \\
-        $logo \\
-        .
-
-    cat <<-END_VERSIONS > versions.yml
-    "${task.process}":
-        multiqc: \$( multiqc --version | sed -e "s/multiqc, version //g" )
-    END_VERSIONS
-    """
-
-    stub:
-    """
-    mkdir multiqc_data
-    touch multiqc_plots
-    touch multiqc_report.html
-
-    cat <<-END_VERSIONS > versions.yml
-    "${task.process}":
-        multiqc: \$( multiqc --version | sed -e "s/multiqc, version //g" )
-    END_VERSIONS
-    """
-}
diff --git a/modules/nf-core/multiqc/meta.yml b/modules/nf-core/multiqc/meta.yml
deleted file mode 100644
index 45a9bc3..0000000
--- a/modules/nf-core/multiqc/meta.yml
+++ /dev/null
@@ -1,58 +0,0 @@
-name: multiqc
-description: Aggregate results from bioinformatics analyses across many samples into a single report
-keywords:
-  - QC
-  - bioinformatics tools
-  - Beautiful stand-alone HTML report
-tools:
-  - multiqc:
-      description: |
-        MultiQC searches a given directory for analysis logs and compiles a HTML report.
-        It's a general use tool, perfect for summarising the output from numerous bioinformatics tools.
-      homepage: https://multiqc.info/
-      documentation: https://multiqc.info/docs/
-      licence: ["GPL-3.0-or-later"]
-input:
-  - multiqc_files:
-      type: file
-      description: |
-        List of reports / files recognised by MultiQC, for example the html and zip output of FastQC
-  - multiqc_config:
-      type: file
-      description: Optional config yml for MultiQC
-      pattern: "*.{yml,yaml}"
-  - extra_multiqc_config:
-      type: file
-      description: Second optional config yml for MultiQC. Will override common sections in multiqc_config.
-      pattern: "*.{yml,yaml}"
-  - multiqc_logo:
-      type: file
-      description: Optional logo file for MultiQC
-      pattern: "*.{png}"
-output:
-  - report:
-      type: file
-      description: MultiQC report file
-      pattern: "multiqc_report.html"
-  - data:
-      type: directory
-      description: MultiQC data dir
-      pattern: "multiqc_data"
-  - plots:
-      type: file
-      description: Plots created by MultiQC
-      pattern: "*_data"
-  - versions:
-      type: file
-      description: File containing software versions
-      pattern: "versions.yml"
-authors:
-  - "@abhi18av"
-  - "@bunop"
-  - "@drpatelh"
-  - "@jfy133"
-maintainers:
-  - "@abhi18av"
-  - "@bunop"
-  - "@drpatelh"
-  - "@jfy133"
diff --git a/modules/nf-core/multiqc/tests/main.nf.test b/modules/nf-core/multiqc/tests/main.nf.test
deleted file mode 100644
index f1c4242..0000000
--- a/modules/nf-core/multiqc/tests/main.nf.test
+++ /dev/null
@@ -1,84 +0,0 @@
-nextflow_process {
-
-    name "Test Process MULTIQC"
-    script "../main.nf"
-    process "MULTIQC"
-
-    tag "modules"
-    tag "modules_nfcore"
-    tag "multiqc"
-
-    test("sarscov2 single-end [fastqc]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of(file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastqc/test_fastqc.zip', checkIfExists: true))
-                input[1] = []
-                input[2] = []
-                input[3] = []
-                """
-            }
-        }
-
-        then {
-            assertAll(
-                { assert process.success },
-                { assert process.out.report[0] ==~ ".*/multiqc_report.html" },
-                { assert process.out.data[0] ==~ ".*/multiqc_data" },
-                { assert snapshot(process.out.versions).match("multiqc_versions_single") }
-            )
-        }
-
-    }
-
-    test("sarscov2 single-end [fastqc] [config]") {
-
-        when {
-            process {
-                """
-                input[0] = Channel.of(file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastqc/test_fastqc.zip', checkIfExists: true))
-                input[1] = Channel.of(file("https://github.com/nf-core/tools/raw/dev/nf_core/pipeline-template/assets/multiqc_config.yml", checkIfExists: true))
-                input[2] = []
-                input[3] = []
-                """
-            }
-        }
-
-        then {
-            assertAll(
-                { assert process.success },
-                { assert process.out.report[0] ==~ ".*/multiqc_report.html" },
-                { assert process.out.data[0] ==~ ".*/multiqc_data" },
-                { assert snapshot(process.out.versions).match("multiqc_versions_config") }
-            )
-        }
-    }
-
-    test("sarscov2 single-end [fastqc] - stub") {
-
-        options "-stub"
-
-        when {
-            process {
-                """
-                input[0] = Channel.of(file(params.modules_testdata_base_path + 'genomics/sarscov2/illumina/fastqc/test_fastqc.zip', checkIfExists: true))
-                input[1] = []
-                input[2] = []
-                input[3] = []
-                """
-            }
-        }
-
-        then {
-            assertAll(
-                { assert process.success },
-                { assert snapshot(process.out.report.collect { file(it).getName() } +
-                                process.out.data.collect { file(it).getName() } +
-                                process.out.plots.collect { file(it).getName() } +
-                                process.out.versions ).match("multiqc_stub") }
-            )
-        }
-
-    }
-}
diff --git a/modules/nf-core/multiqc/tests/main.nf.test.snap b/modules/nf-core/multiqc/tests/main.nf.test.snap
deleted file mode 100644
index bfebd80..0000000
--- a/modules/nf-core/multiqc/tests/main.nf.test.snap
+++ /dev/null
@@ -1,41 +0,0 @@
-{
-    "multiqc_versions_single": {
-        "content": [
-            [
-                "versions.yml:md5,21f35ee29416b9b3073c28733efe4b7d"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-02-29T08:48:55.657331"
-    },
-    "multiqc_stub": {
-        "content": [
-            [
-                "multiqc_report.html",
-                "multiqc_data",
-                "multiqc_plots",
-                "versions.yml:md5,21f35ee29416b9b3073c28733efe4b7d"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-02-29T08:49:49.071937"
-    },
-    "multiqc_versions_config": {
-        "content": [
-            [
-                "versions.yml:md5,21f35ee29416b9b3073c28733efe4b7d"
-            ]
-        ],
-        "meta": {
-            "nf-test": "0.8.4",
-            "nextflow": "23.10.1"
-        },
-        "timestamp": "2024-02-29T08:49:25.457567"
-    }
-}
\ No newline at end of file
diff --git a/modules/nf-core/multiqc/tests/tags.yml b/modules/nf-core/multiqc/tests/tags.yml
deleted file mode 100644
index bea6c0d..0000000
--- a/modules/nf-core/multiqc/tests/tags.yml
+++ /dev/null
@@ -1,2 +0,0 @@
-multiqc:
-  - modules/nf-core/multiqc/**
diff --git a/nextflow.config b/nextflow.config
index 3fb2d75..e39cd2f 100644
--- a/nextflow.config
+++ b/nextflow.config
@@ -12,6 +12,7 @@ params {
     // TODO nf-core: Specify your pipeline's command line flags
     // Input options
     input                        = null
+    mapped                       = false
 
     // Boilerplate options
     outdir                       = null
diff --git a/nextflow_schema.json b/nextflow_schema.json
index 55b26b3..f198603 100644
--- a/nextflow_schema.json
+++ b/nextflow_schema.json
@@ -20,7 +20,7 @@
                     "mimetype": "text/yaml",
                     "pattern": "^\\S+\\.yaml$",
                     "description": "Path to yaml file containing information about the samples in the experiment.",
-                    "help_text": "You will need to create a design file with information about the samples in your experiment before running the pipeline. Use this parameter to specify its location. It has to be a comma-separated file with 3 columns, and a header row.",
+                    "help_text": "You will need to create a yaml file which contains data on the sample at hand",
                     "fa_icon": "fas fa-file-yaml"
                 },
                 "outdir": {
diff --git a/subworkflows/local/main_mapping.nf b/subworkflows/local/main_mapping.nf
new file mode 100644
index 0000000..28c100f
--- /dev/null
+++ b/subworkflows/local/main_mapping.nf
@@ -0,0 +1,77 @@
+include { SE_MAPPING        } from './se_mapping'
+include { PE_MAPPING        } from './pe_mapping'
+
+include { SAMTOOLS_SORT     } from '../../modules/nf-core/samtools/sort/main'
+
+
+workflow MAIN_MAPPING {
+    // Aligns the reads to reference_hap1, sorts the resulting BAM and emits it keyed by [id: sample_id].
+    take:
+    sample_id               // val(sample_id)
+    platform                // val(data_type)
+    reference_hap1          // tuple val(meta), path(reference)
+    pacbio_tuple            // tuple val(meta), path(longread_path)
+
+    main:
+    ch_align_bam    = Channel.empty()
+    ch_versions     = Channel.empty()
+
+    //
+    // LOGIC: SANGER-TOL/BLOBTOOLKIT expects the pacbio data to be already mapped -> this has been changed but seeing as BTK and genomenote need it then we may as well keep it.
+    //          This is also a requirement for genomenote
+    // NOTE(review): platform.filter { ... } appears to return a channel rather than a boolean, so this test looks
+    //          always-true and the PE_MAPPING branch may never run - confirm, and branch on the value if so.
+    if ( platform.filter { it == "hifi" } || platform.filter { it == "clr" } || platform.filter { it == "ont" } ) {
+        //
+        // SUBWORKFLOW: SINGLE END MAPPING FOR ALIGNING LONGREAD DATA
+        //
+        SE_MAPPING (
+            reference_hap1,
+            pacbio_tuple,
+            platform
+        )
+        ch_versions = ch_versions.mix(SE_MAPPING.out.versions)
+
+        ch_align_bam
+            .mix( SE_MAPPING.out.mapped_bam )
+            .set { merged_bam }
+    }
+    else if ( platform.filter { it == "illumina" } ) {
+        //
+        // SUBWORKFLOW: PAIRED END MAPPING FOR ALIGNING ILLUMINA DATA
+        //
+        PE_MAPPING  (
+            reference_hap1,
+            pacbio_tuple,
+            platform
+        )
+        ch_versions = ch_versions.mix(PE_MAPPING.out.versions)
+
+        ch_align_bam
+            .mix( PE_MAPPING.out.mapped_bam )
+            .set { merged_bam }
+    }
+
+    //
+    // MODULE: SORT MAPPED BAM
+    //
+    SAMTOOLS_SORT (
+        merged_bam,
+        reference_hap1
+    )
+    ch_versions = ch_versions.mix( SAMTOOLS_SORT.out.versions )
+    // Emit the SORTED bam (previously the unsorted merged_bam was re-emitted); meta is rebuilt from sample_id.
+    sample_id
+        .combine(SAMTOOLS_SORT.out.bam)
+        .map{ sample_id, pacbio_meta, pacbio_path ->
+            tuple(  [id: sample_id],
+                    pacbio_path
+            )
+        }
+        .set { mapped_bam }
+
+    emit:
+    mapped_bam                        // channel: tuple val(meta), path(mapped_bam)
+    versions       = ch_versions      // channel: [ path(versions.yml) ]
+
+}
\ No newline at end of file
diff --git a/subworkflows/local/yaml_input.nf b/subworkflows/local/yaml_input.nf
index 687c5db..916c003 100644
--- a/subworkflows/local/yaml_input.nf
+++ b/subworkflows/local/yaml_input.nf
@@ -4,7 +4,7 @@ import groovy.yaml.YamlSlurper
 
 workflow YAML_INPUT {
     take:
-    input_file          // params.input
+    input_file                  // params.input
 
     main:
     ch_versions                 = Channel.empty()
@@ -58,44 +58,61 @@ workflow YAML_INPUT {
         }
         .set {cpretext_hic_dir}
 
+
+    if (params.mapped) {
+        bam_path = Channel.of(inputs.mapped_bam)
+
+        sample_id
+            .combine(bam_path)
+            .map{ sample, dir ->
+                tuple([id: sample],
+                    dir
+                )
+            }
+            .set {mapped_bam}
+    } else {
+        mapped_bam = [[],[]]
+    }
+
     emit:
     //
     // LOGIC: Building generic channels
     //
     sample_id
-    longread_type                                               // val(data)
-    longread_dir            = inputs.longread.dir               // DataVariable
-    pacbio_tuple                                                // tuple (meta), path(file)
-    reference_hap1          = reference_hap1                    // tuple (meta), path(file)
-    reference_hap2          = reference_2                       // DataVariable
-    reference_path          = inputs.reference_hap1             // DataVariable
+    longread_type                                                   // val(data)
+    longread_dir                = inputs.longread.dir               // DataVariable
+    pacbio_tuple                                                    // tuple (meta), path(file)
+    reference_hap1                                                  // tuple (meta), path(file)
+    reference_hap2              = reference_2                       // DataVariable
+    reference_path              = inputs.reference_hap1             // DataVariable
+    mapped_bam
 
     //
     // LOGIC: Building CurationPretext specific channels
     //
     cpretext_aligner
     cpretext_telomere_motif
-    cpretext_hic_dir_raw    = inputs.curationpretext.hic_dir    // DataVariable
+    cpretext_hic_dir_raw        = inputs.curationpretext.hic_dir    // DataVariable
 
     //
     // LOGIC: MERQURY CHANNELS
     //
-    fastk_hist              = Channel.of(inputs.merquryfk.fastk_hist)
-    fastk_ktab              = Channel.of(inputs.merquryfk.fastk_ktab)
+    fastk_hist                  = Channel.fromPath(inputs.merquryfk.fastk_hist)
+    fastk_ktab                  = Channel.fromPath(inputs.merquryfk.fastk_ktab, hidden: true)
 
     //
     // LOGIC: Building BlobToolKit specific channels
     //
-    btk_nt_database         = Channel.of(inputs.btk.nt_database)
-    btk_nt_database_prefix  = Channel.of(inputs.btk.nt_database_prefix)
-    btk_nt_diamond_database = Channel.of(inputs.btk.diamond_nr_database_path)
-    btk_un_diamond_database = Channel.of(inputs.btk.diamond_uniprot_database_path)
-    btk_ncbi_taxonomy_path  = Channel.of(inputs.btk.ncbi_taxonomy_path)
-    btk_ncbi_lineage_path   = Channel.of(inputs.btk.ncbi_rankedlineage_path)
-    btk_yaml                = Channel.of(inputs.btk.btk_yaml)
-    btk_taxid               = Channel.of(inputs.btk.taxid)
-    btk_gca_accession       = Channel.of(inputs.btk.gca_accession)
-    busco_lineages          = Channel.of(inputs.btk.lineages)
-
-    versions                = ch_versions.ifEmpty(null)
+    btk_nt_database             = Channel.of(inputs.btk.nt_database)
+    btk_nt_database_prefix      = Channel.of(inputs.btk.nt_database_prefix)
+    btk_nt_diamond_database     = Channel.of(inputs.btk.diamond_nr_database_path)
+    btk_un_diamond_database     = Channel.of(inputs.btk.diamond_uniprot_database_path)
+    btk_ncbi_taxonomy_path      = Channel.of(inputs.btk.ncbi_taxonomy_path)
+    btk_ncbi_lineage_path       = Channel.of(inputs.btk.ncbi_rankedlineage_path)
+    btk_taxid                   = Channel.of(inputs.btk.taxid)
+    btk_gca_accession           = Channel.of(inputs.btk.gca_accession)
+    busco_lineages              = Channel.of(inputs.btk.lineages)
+    btk_config                  = Channel.fromPath(inputs.btk.config)
+
+    versions                    = ch_versions.ifEmpty(null)
 }
diff --git a/workflows/ear.nf b/workflows/ear.nf
index 9f90920..1c93b33 100644
--- a/workflows/ear.nf
+++ b/workflows/ear.nf
@@ -4,17 +4,20 @@
 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 */
 
-include { NEXTFLOW_RUN as CURATIONPRETEXT   } from '../modules/local/nextflow/run'
-include { NEXTFLOW_RUN as BLOBTOOLKIT       } from '../modules/local/nextflow/run'
+// Subpipeline imports
 include { SANGER_TOL_BTK                    } from '../modules/local/sanger_tol_btk'
+include { SANGER_TOL_CPRETEXT               } from '../modules/local/sanger_tol_cpretext'
 
+// Subworkflow imports
 include { YAML_INPUT                        } from '../subworkflows/local/yaml_input'
+include { MAIN_MAPPING                      } from '../subworkflows/local/main_mapping'
+
+// Module imports
 include { GENERATE_SAMPLESHEET              } from '../modules/local/generate_samplesheet'
 include { GFASTATS                          } from '../modules/nf-core/gfastats/main'
-include { PE_MAPPING                        } from '../subworkflows/local/pe_mapping'
-include { SE_MAPPING                        } from '../subworkflows/local/se_mapping'
-include { SAMTOOLS_SORT                     } from '../modules/nf-core/samtools/sort/main'
+include { MERQURYFK_MERQURYFK               } from '../modules/nf-core/merquryfk/merquryfk/main'
 
+// Plugin imports
 include { paramsSummaryMap                  } from 'plugin/nf-validation'
 include { paramsSummaryMultiqc              } from '../subworkflows/nf-core/utils_nfcore_pipeline'
 include { softwareVersionsToYAML            } from '../subworkflows/nf-core/utils_nfcore_pipeline'
@@ -32,45 +35,21 @@ workflow EAR {
     ch_input
 
     main:
-
+    params.mapped   = false
     ch_versions     = Channel.empty()
     ch_align_bam    = Channel.empty()
 
+
     //
     // MODULE: YAML_INPUT
+    //          - YAML_INPUT SHOULD BE REWORKED TO BE SMARTER
     //
     YAML_INPUT(ch_input)
 
-    //
-    // MODULE: Run Sanger-ToL/CurationPretext
-    //         - This was built using: https://github.com/mahesh-panchal/nf-cascade
-    //
-    reference = YAML_INPUT.out.reference_path.get()
-    hic_dir = YAML_INPUT.out.cpretext_hic_dir_raw.get()
-    longread_dir = YAML_INPUT.out.longread_dir.get()
-
-    CURATIONPRETEXT(
-        "sanger-tol/curationpretext",
-        [
-            "-r 1.0.0",
-            "--input",
-            reference,
-            "--longread",
-            longread_dir,
-            "--cram",
-            hic_dir,
-            "-profile singularity,sanger"
-        ].join(" ").trim(), // workflow opts
-        Channel.value([]),  //readWithDefault( params.demo.params_file, Channel.value([]) ), // params file
-        Channel.value([]),  // samplesheet - not used by this pipeline
-        Channel.value([])   //readWithDefault( params.demo.add_config, Channel.value([]) ),  // custom config
-        //"$params.outdir/curationpretext",
-    )
 
     //
     // MODULE: ASSEMBLY STATISTICS FOR THE FASTA
     //
-
     GFASTATS(
         YAML_INPUT.out.reference_hap1,
         "fasta",
@@ -81,135 +60,102 @@ workflow EAR {
         [],
         []
     )
+    ch_versions = ch_versions.mix( GFASTATS.out.versions )
+
 
     //
     // LOGIC:  REFORMAT A BUNCH OF CHANNELS FOR MERQUERYFK
     //
+    YAML_INPUT.out.reference_hap1
+        .combine(YAML_INPUT.out.reference_hap2)
+        .combine(YAML_INPUT.out.fastk_hist)
+        .combine(YAML_INPUT.out.fastk_ktab)
+        .map{ meta, primary, haplotigs, fastk_hist, fastk_ktab ->
+            tuple(  meta,
+                    fastk_hist,
+                    fastk_ktab,
+                    primary,
+                    haplotigs
+            )
+        }
+        .set { merquryfk_input }
 
-    if (params.reference_hap2) {
-        YAML_INPUT.out.reference_hap1
-            .combine(YAML_INPUT.out.reference_hap2)
-            .combine(YAML_INPUT.out.fastk_hist)
-            .combine(YAML_INPUT.out.fastk_ktab)
-            .map{ meta, primary, haplotigs, fastk_hist, fastk_ktab ->
-                tuple(  meta,
-                        fastk_hist,
-                        fastk_ktab,
-                        primary,
-                        haplotigs
-                )
-            }
-            .set { merquryfk_input }
-
-        //
-        // MODULE: MERQURYFK PLOTS OF GENOME
-        //
-
-        MERQURYFK(
-            merquryfk_input
-        )
-    }
 
     //
-    // LOGIC: SANGER-TOL/BLOBTOOLKIT expects the pacbio data to be already mapped -> this has been changed but seeing as BTK and genomenote need it then we may as well keep it.
-    //          This is also a requirement for genomenote
+    // MODULE: MERQURYFK PLOTS OF GENOME
     //
-    platform = YAML_INPUT.out.longread_type
+    MERQURYFK_MERQURYFK(
+        merquryfk_input
+    )
+    ch_versions = ch_versions.mix( MERQURYFK_MERQURYFK.out.versions )
 
-    YAML_INPUT.out.sample_id
-        .combine(YAML_INPUT.out.longread_dir)
-        .map{ sample, dir ->
-            tuple([id: sample], dir )
-        }
-        .set {pacbio_tuple}
 
-    if ( platform.filter { it == "hifi" } || platform.filter { it == "clr" } || platform.filter { it == "ont" } ) {
+    //
+    // LOGIC: IF A MAPPED BAM FILE EXISTS AND THE FLAG `mapped` IS TRUE
+    //          SKIP THE MAPPING SUBWORKFLOW
+    //
+    if (!params.mapped) {
         //
-        // SUBWORKFLOW: SINGLE END MAPPING FOR ALIGNING LONGREAD DATA
+        // SUBWORKFLOW: MAIN_MAPPING CONTAINS ALL THE MAPPING LOGIC
+        //              This allows us to more easily bypass the mapping if we already have a sorted and mapped bam
         //
-        SE_MAPPING (
+        MAIN_MAPPING (
+            YAML_INPUT.out.sample_id,
+            YAML_INPUT.out.longread_type,
             YAML_INPUT.out.reference_hap1,
             YAML_INPUT.out.pacbio_tuple,
-            platform
         )
-        ch_versions = ch_versions.mix(SE_MAPPING.out.versions)
-
-        ch_align_bam
-            .mix( SE_MAPPING.out.mapped_bam )
-            .set { merged_bam }
+        ch_versions = ch_versions.mix( MAIN_MAPPING.out.versions )
+        ch_mapped_bam = MAIN_MAPPING.out.mapped_bam
+    } else {
+        ch_mapped_bam = YAML_INPUT.out.mapped_bam
     }
-    else if ( platform.filter { it == "illumina" } ) {
-        //
-        // SUBWORKFLOW: PAIRED END MAPPING FOR ALIGNING LONGREAD DATA
-        //
-        PE_MAPPING  (
-            YAML_INPUT.out.reference_hap1,
-            YAML_INPUT.out.pacbio_tuple,
-            platform
-        )
-        ch_versions = ch_versions.mix(PE_MAPPING.out.versions)
 
-        ch_align_bam
-            .mix( PE_MAPPING.out.mapped_bam )
-            .set { merged_bam }
-    }
-
-    //
-    // MODULE: SORT MAPPED BAM
-    //
-    SAMTOOLS_SORT (
-        merged_bam,
-        YAML_INPUT.out.reference_hap1
-    )
-    ch_versions = ch_versions.mix( SAMTOOLS_SORT.out.versions )
 
     //
     // MODULE: GENERATE_SAMPLESHEET creates a csv for the blobtoolkit pipeline
     //
-    YAML_INPUT.out.sample_id
-        .combine(merged_bam)
-        .map{ sample_id, pacbio_meta, pacbio_path ->
-            tuple(  [id: sample_id],
-                    pacbio_path
-            )
-        }
-        .set { mapped_bam }
-
-
     GENERATE_SAMPLESHEET(
-        mapped_bam
+        ch_mapped_bam
     )
     ch_versions = ch_versions.mix( GENERATE_SAMPLESHEET.out.versions )
 
+
     //
     // MODULE: Run Sanger-ToL/BlobToolKit
     //
-    YAML_INPUT.out.reference_hap1.view{ it -> "Reference: $it"}
-    mapped_bam.view{ it -> "samplesheet: $it"}
-    GENERATE_SAMPLESHEET.out.csv.view{ it -> "samplesheetcsv: $it"}
-    YAML_INPUT.out.btk_un_diamond_database.view{ it -> "un diamond: $it"}
-    YAML_INPUT.out.btk_nt_database.view{ it -> "nt diamond: $it"}
-    YAML_INPUT.out.btk_ncbi_taxonomy_path.view{ it -> "Taxdump: $it"}
-    YAML_INPUT.out.btk_yaml.view{ it -> "btk_yaml: $it"}
-    YAML_INPUT.out.busco_lineages.view{ it -> "lineages: $it"}
-    YAML_INPUT.out.btk_taxid.view{ it -> "TAXID: $it"}
-
     SANGER_TOL_BTK (
         YAML_INPUT.out.reference_hap1,
-        mapped_bam,
+        ch_mapped_bam,
         GENERATE_SAMPLESHEET.out.csv,
         YAML_INPUT.out.btk_un_diamond_database,
         YAML_INPUT.out.btk_nt_database,
         YAML_INPUT.out.btk_un_diamond_database,
-        [],
+        YAML_INPUT.out.btk_config,
         YAML_INPUT.out.btk_ncbi_taxonomy_path,
-        YAML_INPUT.out.btk_yaml,
         YAML_INPUT.out.busco_lineages,
         YAML_INPUT.out.btk_taxid,
         'GCA_0001'
     )
     ch_versions              = ch_versions.mix(SANGER_TOL_BTK.out.versions)
 
+
+    //
+    // MODULE: Run Sanger-ToL/CurationPretext
+    //
+    reference       = YAML_INPUT.out.reference_path.get()
+    hic_dir         = YAML_INPUT.out.cpretext_hic_dir_raw.get()
+    longread_dir    = YAML_INPUT.out.longread_dir.get()
+
+    SANGER_TOL_CPRETEXT(
+        reference,
+        longread_dir,
+        hic_dir,
+        []
+    )
+    ch_versions = ch_versions.mix( SANGER_TOL_CPRETEXT.out.versions )
+
+
     //
     // Collate and save software versions
     //
@@ -225,26 +171,10 @@ workflow EAR {
         workflow, parameters_schema: "nextflow_schema.json")
     ch_workflow_summary = Channel.value(paramsSummaryMultiqc(summary_params))
 
-
-
     emit:
     versions       = ch_versions                 // channel: [ path(versions.yml) ]
 }
 
-
-process RenameDatabase {
-    tag "Rename DMND Database"
-    executor 'local'
-
-    input:
-    db_path
-
-    output:
-    path "UN.dmnd"
-
-    "true"
-}
-
 /*
 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
     THE END