nf-core
diff --git a/‎.github/workflows/ci.yml
+79-21 b/‎.github/workflows/ci.yml
+79-21
diff --git a/‎.gitignore
+1-1 b/‎.gitignore
+1-1
diff --git a/‎conf/modules.config
+3-3 b/‎conf/modules.config
+3-3
diff --git a/‎conf/tests/germline_small.config
+43 b/‎conf/tests/germline_small.config
+43
diff --git a/‎conf/tests/germline_sv.config
+44 b/‎conf/tests/germline_sv.config
+44
diff --git a/‎conf/tests/liftover_hg37.config
+41 b/‎conf/tests/liftover_hg37.config
+41
diff --git a/‎conf/tests/liftover_hg38.config
+41 b/‎conf/tests/liftover_hg38.config
+41
diff --git a/‎conf/tests/somatic_indel.config
+37 b/‎conf/tests/somatic_indel.config
+37
@@ -1,59 +1,117 @@
 name: nf-core CI
 # This workflow runs the pipeline with the minimal test dataset to check that it completes without any syntax errors
 on:
-  push:
+  pull_request:
     branches:
       - dev
-  pull_request:
+      - master
   release:
     types: [published]
   workflow_dispatch:
 
 env:
+  NFT_DIFF: "pdiff"
+  NFT_DIFF_ARGS: "--line-numbers --expand-tabs=2"
+  NFT_VER: "0.9.2"
+  NFT_WORKDIR: "~"
   NXF_ANSI_LOG: false
+  NXF_SINGULARITY_CACHEDIR: ${{ github.workspace }}/.singularity
+  NXF_SINGULARITY_LIBRARYDIR: ${{ github.workspace }}/.singularity
 
 concurrency:
   group: "${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}"
   cancel-in-progress: true
 
 jobs:
   test:
-    name: Run pipeline with test data
+    name: "${{ matrix.NXF_VER }} | ${{ matrix.profile }} | ${{ matrix.shard }}/6"
     # Only run on push if this is the nf-core dev branch (merged PRs)
     if: "${{ github.event_name != 'push' || (github.event_name == 'push' && github.repository == 'nf-core/variantbenchmarking') }}"
     runs-on: ubuntu-latest
     strategy:
+      fail-fast: false
       matrix:
         NXF_VER:
           - "24.04.2"
-          - "latest-everything"
+          - "latest-stable"
+        profile:
+          - "docker"
+          - "singularity"
+        isMaster:
+          - ${{ github.base_ref == 'master' }}
+        # Exclude conda and singularity on dev
+        exclude:
+          - isMaster: false
+            profile: "conda"
+          - isMaster: false
+            profile: "singularity"
+        shard: [1, 2, 3, 4, 5, 6]
     steps:
       - name: Check out pipeline code
         uses: actions/checkout@0ad4b8fadaa221de15dcec353f45205ec38ea70b # v4
+        with:
+          fetch-depth: 0
 
-      - name: Install Nextflow
+      - name: Set up Nextflow
         uses: nf-core/setup-nextflow@v2
         with:
           version: "${{ matrix.NXF_VER }}"
 
-      - name: Disk space cleanup
-        uses: jlumbroso/free-disk-space@54081f138730dfa15788a46383842cd2f914a1be # v1.3.1
+      - name: Set up Apptainer
+        if: matrix.profile == 'singularity'
+        uses: eWaterCycle/setup-apptainer@main
+
+      - name: Set up Singularity
+        if: matrix.profile == 'singularity'
+        run: |
+          mkdir -p $NXF_SINGULARITY_CACHEDIR
+          mkdir -p $NXF_SINGULARITY_LIBRARYDIR
+
+      - name: Set up Miniconda
+        if: matrix.profile == 'conda'
+        uses: conda-incubator/setup-miniconda@a4260408e20b96e80095f42ff7f1a15b27dd94ca # v3
+        with:
+          miniconda-version: "latest"
+          auto-update-conda: true
+          conda-solver: libmamba
+          channels: conda-forge,bioconda
 
-      - name: Run pipeline with test data for germline analysis (docker)
-        # TODO nf-core: You can customise CI pipeline run tests as required
-        # For example: adding multiple test runs with different parameters
-        # Remember that you can parallelise this by using strategy.matrix
+      - name: Set up Conda
+        if: matrix.profile == 'conda'
         run: |
-          nextflow run ${GITHUB_WORKSPACE} -profile test,docker --outdir ./results
+          echo $(realpath $CONDA)/condabin >> $GITHUB_PATH
+          echo $(realpath python) >> $GITHUB_PATH
 
-      - name: Run pipeline with test data (singularity)
-        # TODO nf-core: You can customise CI pipeline run tests as required
+      - name: Clean up Disk space
+        uses: jlumbroso/free-disk-space@54081f138730dfa15788a46383842cd2f914a1be # v1.3.1
+
+      - uses: actions/setup-python@v4
+        with:
+          python-version: "3.11"
+          architecture: "x64"
+
+      - name: Install pdiff to see diff between nf-test snapshots
         run: |
-          nextflow run ${GITHUB_WORKSPACE} -profile test,singularity --outdir ./results
-        if: "${{ github.base_ref == 'master' }}"
+          python -m pip install --upgrade pip
+          pip install pdiff
 
-      - name: Run pipeline with test data (conda)
-        # TODO nf-core: You can customise CI pipeline run tests as required
+      - uses: nf-core/setup-nf-test@v1
+        with:
+          version: ${{ env.NFT_VER }}
+
+      - name: Run Tests (Shard ${{ matrix.shard }}/6)
         run: |
-          nextflow run ${GITHUB_WORKSPACE} -profile test,conda --outdir ./results
-        if: "${{ github.base_ref == 'master' }}"
+          nf-test test \
+              --ci \
+              --shard ${{ matrix.shard }}/6 \
+              --changed-since HEAD^ \
+              --profile "+${{ matrix.profile }}" \
+              --filter pipeline \
+              --junitxml=test.xml
+
+      - name: Publish Test Report
+        uses: mikepenz/action-junit-report@v3
+        if: always() # always run even if the previous step fails
+        with:
+          report_paths: test.xml
+          annotate_only: true
@@ -13,4 +13,4 @@ null/*
 results*/*
 .nf-test/
 .nf-test.log
-
+test/.nf-test.log
@@ -39,7 +39,7 @@ process {
         ]
     }
     withName: SVYNC {
-        ext.prefix = {"${meta.id}.${meta.caller}"}
+        ext.prefix = {"${meta.id}.${meta.caller}.svync"}
         publishDir = [
             path: {"${params.outdir}/${params.variant_type}/${meta.id}/preprocess"},
             pattern: "*{.vcf.gz,vcf.gz.tbi}",
@@ -192,7 +192,7 @@ process {
         ]
     }
     withName: "HAPPY_PREPY" {
-        ext.prefix = {"${meta.id}.${params.truth_id}.${meta.caller}"}
+        ext.prefix = {"${meta.id}.${params.truth_id}.${meta.caller}.prepy"}
         ext.args   = {"--fixchr --filter-nonref --bcftools-norm"}
         publishDir = [
             path: {"${params.outdir}/${params.variant_type}/${meta.id}/preprocess"},
@@ -315,7 +315,7 @@ process {
         ]
     }
     withName: PICARD_LIFTOVERVCF {
-        ext.prefix = {"${meta.id}}"}
+        ext.prefix = {"${meta.id}"}
         ext.args = {"--WARN_ON_MISSING_CONTIG true"}
     }
     withName: BCFTOOLS_RENAME_CHR {
 
@@ -0,0 +1,43 @@
+/*
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Nextflow config file for running minimal tests
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Defines input files and everything required to run a fast and simple pipeline test.
+
+    Use as follows:
+        nextflow run nf-core/variantbenchmarking -profile test,<docker/singularity> --outdir <OUTDIR>
+
+----------------------------------------------------------------------------------------
+*/
+
+process {
+    resourceLimits = [
+        cpus: 4,
+        memory: '15.GB',
+        time: '1.h'
+    ]
+}
+
+params {
+    config_profile_name        = 'Test profile'
+    config_profile_description = 'Minimal test dataset to check pipeline function'
+
+    // Input data
+    input                = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/samplesheet_small.csv"
+    outdir               = "results"
+
+    // Genome references
+    genome               = 'GRCh38'
+
+    // Processes
+    analysis             = 'germline'
+    variant_type         = "small"
+    method               = 'happy,rtgtools'
+    preprocess           = "normalization,deduplication,prepy"
+    include_expression   = 'FILTER="."'
+
+    // truth information
+    truth_id             = "HG002"
+    truth_vcf            = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/CRMG_benchmark_dataset/HG002_GRCh38_CMRG_smallvar_v1.00.vcf.gz"
+    regions_bed          = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/CRMG_benchmark_dataset/HG002_GRCh38_CMRG_smallvar_v1.00.bed"
+}
@@ -0,0 +1,44 @@
+/*
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Nextflow config file for running minimal tests
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Defines input files and everything required to run a fast and simple pipeline test.
+
+    Use as follows:
+        nextflow run nf-core/variantbenchmarking -profile test,<docker/singularity> --outdir <OUTDIR>
+
+----------------------------------------------------------------------------------------
+*/
+
+process {
+    resourceLimits = [
+        cpus: 4,
+        memory: '15.GB',
+        time: '1.h'
+    ]
+}
+
+params {
+    config_profile_name        = 'Test profile'
+    config_profile_description = 'Minimal test dataset to check pipeline function'
+
+    // Input data
+    input                = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/samplesheet_sv.csv"
+    outdir               = "results"
+
+    // Genome references
+    genome               = 'GRCh38'
+
+    // Processes
+    analysis             = 'germline'
+    variant_type         = "structural"
+    method               = 'svanalyzer,wittyer,truvari'
+    preprocess           = "normalization,deduplication"
+    sv_standardization   = "svync,homogenize"
+    min_sv_size          = 30
+    truth_id             = "HG002"
+    include_expression   = 'FILTER="."'
+
+    truth_vcf            = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/hg38/truth/HG002_GRCh38_difficult_medical_gene_SV_benchmark_v0.01.chr21.vcf.gz"
+    regions_bed          = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/hg38/truth/HG002_GRCh38_difficult_medical_gene_SV_benchmark_v01.ch21.bed"
+}
@@ -0,0 +1,41 @@
+/*
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Nextflow config file for running minimal tests
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Defines input files and everything required to run a fast and simple pipeline test.
+
+    Use as follows:
+        nextflow run nf-core/variantbenchmarking -profile test_liftover,<docker/singularity> --outdir <OUTDIR>
+
+----------------------------------------------------------------------------------------
+*/
+
+params {
+    config_profile_name        = 'Test profile'
+    config_profile_description = 'Minimal test dataset to check pipeline function'
+
+    // Limit resources so that this can run on GitHub Actions
+    max_cpus              = 2
+    max_memory            = '6.5GB'
+    max_time              = '8.h'
+
+    // Input data
+    input                = 'https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/samplesheet_sv_hg37.csv'
+    outdir               = 'results'
+    genome               = 'GRCh37'
+
+    // Processes
+    analysis             = 'germline'
+    variant_type         = "structural"
+    method               = 'truvari'
+    preprocess           = "normalization,deduplication,filter_contigs"
+    min_sv_size          = 30
+
+    truth_id             = "HG002"
+    truth_vcf            = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/hg38/truth/HG002_GRCh38_difficult_medical_gene_SV_benchmark_v0.01.chr21.vcf.gz"
+
+    //liftover files
+    liftover              = true
+    chain                 = "http://ftp.ensembl.org/pub/assembly_mapping/homo_sapiens/GRCh38_to_GRCh37.chain.gz"
+    rename_chr            = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/grch38_grch37.txt"
+}
@@ -0,0 +1,41 @@
+/*
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Nextflow config file for running minimal tests
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Defines input files and everything required to run a fast and simple pipeline test.
+
+    Use as follows:
+        nextflow run nf-core/variantbenchmarking -profile test_liftover,<docker/singularity> --outdir <OUTDIR>
+
+----------------------------------------------------------------------------------------
+*/
+
+params {
+    config_profile_name        = 'Test profile'
+    config_profile_description = 'Minimal test dataset to check pipeline function'
+
+    // Limit resources so that this can run on GitHub Actions
+    max_cpus              = 2
+    max_memory            = '6.5GB'
+    max_time              = '8.h'
+
+    // Input data
+    input                = 'https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/samplesheet_small.csv'
+    outdir               = 'results'
+    genome               = 'GRCh38'
+
+    // Processes
+    analysis             = 'germline'
+    truth_id             = "HG002"
+    variant_type         = "small"
+    method               = 'rtgtools,happy'
+    preprocess           = "normalization,deduplication,filter_contigs"
+
+    truth_vcf            = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/hg37/truth/HG002_GRCh37_1_22_v4.2.1_highconf.chr21.vcf.gz"
+    regions_bed          = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/hg37/truth/HG002_GRCh37_1_22_v4.2.1_highconf.bed"
+
+    //liftover files
+    liftover             = true
+    chain                = "https://raw.githubusercontent.com/broadinstitute/gatk/master/scripts/funcotator/data_sources/gnomAD/b37ToHg38.over.chain"
+    rename_chr           = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/grch37_grch38.txt"
+}
@@ -0,0 +1,37 @@
+/*
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Nextflow config file for running minimal tests
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+    Defines input files and everything required to run a fast and simple pipeline test.
+
+    Use as follows:
+        nextflow run nf-core/variantbenchmarking -profile test_somatic,<docker/singularity> --outdir <OUTDIR>
+
+----------------------------------------------------------------------------------------
+*/
+
+params {
+    config_profile_name        = 'Test profile'
+    config_profile_description = 'Minimal test dataset to check pipeline function'
+
+    // Limit resources so that this can run on GitHub Actions
+    max_cpus   = 2
+    max_memory = '6.5GB'
+    max_time   = '8.h'
+
+    // Input data
+    input           = 'https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/SV_testdata/samplesheet_somatic_indel.csv'
+    outdir          = 'results'
+
+    // Genome references
+    genome          = 'GRCh38'
+    analysis        = 'somatic'
+    truth_id        = "SEQC2"
+    method          = 'sompy'
+    preprocess      = "filter_contigs"
+    variant_type    = "indel"
+
+    truth_vcf       = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/somatic/truth/hg38/sINDEL_truth_set_v1.0.chr21.vcf.gz"
+    regions_bed     = "https://raw.githubusercontent.com/kubranarci/benchmark_datasets/main/somatic/truth/hg38/high-confidence_sINDEL_in_HC_regions_v1.2.chr21.vcf.gz"
+
+}
Original file line number	Diff line number	Diff line change
`@@ -39,7 +39,7 @@ process {`
`39`	`39`	`]`
`40`	`40`	`}`
`41`	`41`	`withName: SVYNC {`
`42`		`- ext.prefix = {"${meta.id}.${meta.caller}"}`
	`42`	`+ ext.prefix = {"${meta.id}.${meta.caller}.svync"}`
`43`	`43`	`publishDir = [`
`44`	`44`	`path: {"${params.outdir}/${params.variant_type}/${meta.id}/preprocess"},`
`45`	`45`	`pattern: "*{.vcf.gz,vcf.gz.tbi}",`
`@@ -192,7 +192,7 @@ process {`
`192`	`192`	`]`
`193`	`193`	`}`
`194`	`194`	`withName: "HAPPY_PREPY" {`
`195`		`- ext.prefix = {"${meta.id}.${params.truth_id}.${meta.caller}"}`
	`195`	`+ ext.prefix = {"${meta.id}.${params.truth_id}.${meta.caller}.prepy"}`
`196`	`196`	`ext.args = {"--fixchr --filter-nonref --bcftools-norm"}`
`197`	`197`	`publishDir = [`
`198`	`198`	`path: {"${params.outdir}/${params.variant_type}/${meta.id}/preprocess"},`
`@@ -315,7 +315,7 @@ process {`
`315`	`315`	`]`
`316`	`316`	`}`
`317`	`317`	`withName: PICARD_LIFTOVERVCF {`
`318`		`- ext.prefix = {"${meta.id}}"}`
	`318`	`+ ext.prefix = {"${meta.id}"}`
`319`	`319`	`ext.args = {"--WARN_ON_MISSING_CONTIG true"}`
`320`	`320`	`}`
`321`	`321`	`withName: BCFTOOLS_RENAME_CHR {`