nextflow_schema.json

{
  "$schema": "http://json-schema.org/draft-07/schema",
  "$id": "https://raw.githubusercontent.com/./main/nextflow_schema.json",
  "title": "artic-network/artic-mpxv-illumina-nf",
  "workflow_title": "Artic Network MPXV Illumina Analysis",
  "description": "Run Illumina MPXV amplicon sequencing bioinformatics",
  "demo_url": "",
  "aws_demo_url": "",
  "url": "https://github.com/artic-network/artic-mpxv-illumina-nf",
  "type": "object",
  "definitions": {
    "input": {
      "title": "Input Options",
      "type": "object",
      "fa_icon": "fas fa-arrow-right",
      "description": "Parameters for finding and handling input data for analysis.",
      "properties": {
        "directory": {
          "type": "string",
          "title": "FASTQ",
          "format": "path",
          "description": "FASTQ files to use in the analysis.",
          "help_text": "Directory containing the input FASTQ files"
        }
      },
      "required": [
        "directory"
      ]
    },
    "primer_scheme_selection": {
      "title": "Primer Scheme Selection",
      "type": "object",
      "fa_icon": "fas fa-code",
      "description": "Reference genome related files and options required for the workflow.",
      "properties": {
        "scheme_name": {
          "type": "string",
          "default": "artic-inrb-mpox/2500/v1.0.0",
          "description": "Primer scheme version.",
          "help_text": "Version of the primer scheme to use as described in the https://github.com/quick-lab/primerschemes/ repository.",
          "enum": [
            "artic-inrb-mpox/2500/v1.0.0",
            "artic-inrb-mpox/400/v1.0.0",
            "yale-mpox/2000/v1.0.0-cladei",
            "yale-mpox/2000/v1.0.0-cladeii",
            "bccdc-mpox/2500/v2.3.0"
          ]
        },
        "freetext_scheme_name": {
          "type": "string",
          "title": "Custom scheme",
          "description": "Custom primer scheme name.",
          "help_text": "If you wish to fetch a primer scheme from the primerschemes repository not listed above please enter it here, it must be in the format `scheme_name/scheme_length/version` as it appears in the https://github.com/quick-lab/primerschemes/ repository."
        },
        "custom_scheme": {
          "type": "string",
          "format": "path",
          "description": "Path to a custom scheme.",
          "help_text": "If you have a custom primer scheme you can enter the details here. This must be the full path to the directory containing your appropriately named scheme bed and fasta files; primer.bed and reference.fasta."
        }
      }
    },
    "output": {
      "title": "Output Options",
      "type": "object",
      "fa_icon": "fas fa-arrow-left",
      "description": "Parameters for saving and naming workflow outputs.",
      "properties": {
        "store_dir": {
          "type": "string",
          "format": "directory-path",
          "title": "Store directory name",
          "description": "Where to store the Hostile T2T reference files.",
          "help_text": "Hostile T2T reference files will be downloaded as part of the workflow and saved in this location, on subsequent runs it will use the same reference. If running through epi2me it is recommended to leave this as the default but if you are not this is required otherwise the pipeline will download lots of copies of the reference in your nextflow work directory.",
          "default": "store_dir"
        },
        "outdir": {
          "type": "string",
          "default": "output",
          "format": "directory-path",
          "description": "Directory for output of all workflow results."
        },
        "prefix": {
          "type": "string",
          "title": "Prefix",
          "description": "Prefix for output files.",
          "help_text": "Prefix for output files, Sequencing run name is a good choice e.g DDMMYY_MACHINEID_RUN_FLOWCELLID."
        }
      },
      "required": [
        "outdir",
        "prefix",
        "store_dir"
      ]
    },
    "squirrel_options": {
      "title": "Squirrel Options",
      "type": "object",
      "description": "Options related to running Squirrel",
      "properties": {
        "skip_squirrel": {
          "type": "boolean",
          "default": false,
          "title": "Skip Squirrel",
          "description": "Do not run alignment and QC pipeline",
          "help_text": ""
        },
        "clade": {
          "type": "string",
          "title": "Clade",
          "description": "Specify whether the sequencing run is primarily `cladeI` or `cladeII`.",
          "enum": [
            "cladei",
            "cladeia",
            "cladeib",
            "cladeii",
            "cladeiia",
            "cladeiib"
          ],
          "help_text": ""
        },
        "outgroups": {
          "type": "string",
          "title": "Outgroups",
          "hidden": true,
          "description": "Specify which MPXV outgroup(s) in the alignment to use in the phylogeny.",
          "help_text": "These are required by the phylogenetics module and will get pruned out from the final tree."
        },
        "squirrel_assembly_refs": {
          "type": "string",
          "format": "path",
          "title": "Assembly References",
          "hidden": true,
          "description": "References to check for `calls to reference` against, used only by the sequence QC process.",
          "help_text": ""
        }
      },
      "required": [
        "clade"
      ],
      "fa_icon": "fas fa-address-card",
      "help_text": ""
    },
    "resource_options": {
      "title": "Resource Options",
      "type": "object",
      "description": "Resource options for the workflow.",
      "properties": {
        "max_cpus": {
          "type": "integer",
          "title": "Max CPUs to use for a process",
          "default": 16,
          "description": "Max number of CPUs to use for a process."
        },
        "max_memory": {
          "type": "string",
          "title": "Memory",
          "default": "32.GB",
          "description": "Maximum possible amount of memory to use for the workflow. Must be in the format 32.GB"
        },
        "max_time": {
          "type": "string",
          "title": "Max time",
          "default": "12.h",
          "description": "Max time to run a process before timeout killing it. Must be in the format 12.h"
        }
      }
    },
    "advanced_options": {
      "title": "Advanced Options",
      "type": "object",
      "fa_icon": "far fa-question-circle",
      "description": "Advanced options for configuring processes inside the workflow.",
      "help_text": "These advanced options do not need to be changed for typical use, but allow fine tuning of workflows for users who want more control over the workflow.",
      "properties": {
        "skip_host_filter": {
          "type": "boolean",
          "title": "Skip host filtering",
          "default": false,
          "description": "Skip host filtering if you are not concerned about human contamination in your dataset."
        },
        "align_consensus": {
          "type": "boolean",
          "title": "Align consensus sequences to the provided reference.",
          "default": false,
          "description": "Align consensus sequences to the provided reference. With extremely low coverage sequences this can lead to the execution hanging as the aligner tries its best to match a long sequence of Ns to something, therefore this is off by default."
        },
        "normalizationTargetDepth": {
          "type": "integer",
          "title": "Normalisation target depth",
          "default": 200,
          "description": "Target depth of coverage to normalize to."
        },
        "discard_incorrect_primer_pairs": {
          "type": "boolean",
          "title": "Discard incorrect read pairs",
          "default": false,
          "description": "Discard read pairs that do not have the expected primer pairs, this can lead to coverage gaps in amplicon overlap regions where the fragment size is lower than the overlap so is off by default."
        },
        "primer_match_threshold": {
          "type": "integer",
          "title": "Primer fuzzy match window size",
          "default": 35,
          "description": "How far from the start of a read to allow a primer match. This compensates for homology between adaptor / barcode in the reference which may otherwise cause read pairs to be dropped."
        },
        "varMinFreqThreshold": {
          "type": "number",
          "title": "Ambiguous variant frequency threshold",
          "default": 0.25,
          "description": "Frequency threshold to call ambiguous variant"
        },
        "varFreqThreshold": {
          "type": "number",
          "title": "Unambiguous variant frequency threshold",
          "default": 0.75,
          "description": "Frequency threshold for unambiguous variant."
        },
        "varMinDepth": {
          "type": "integer",
          "title": "Variant caller minimum depth",
          "default": 10,
          "description": "Minimum coverage depth to call variant"
        },
        "min_mapq": {
          "type": "integer",
          "title": "Minimum mapping quality",
          "default": 20,
          "description": "Minimum mapping quality to consider a read for variant calling."
        },
        "skip_normalize_depth": {
          "type": "boolean",
          "title": "Skip depth normalization",
          "default": false,
          "description": "Skip depth normalization, this will make the pipeline slower."
        }
      }
    },
    "misc": {
      "title": "Miscellaneous Options",
      "type": "object",
      "description": "Everything else.",
      "default": "",
      "properties": {
        "help": {
          "type": "boolean",
          "default": false,
          "description": "Display help text.",
          "fa_icon": "fas fa-question-circle",
          "hidden": true
        },
        "version": {
          "type": "boolean",
          "default": false,
          "description": "Display version.",
          "fa_icon": "fas fa-code-branch",
          "hidden": true
        },
        "fastqSearchPath": {
          "type": "string",
          "title": "FASTQ search path",
          "description": "Path to search for FASTQ files.",
          "help_text": "Path to search for FASTQ files, this is used to find the FASTQ files in the directory specified in the `directory` parameter.",
          "hidden": true
        }
      }
    }
  },
  "allOf": [
    {
      "$ref": "#/definitions/input"
    },
    {
      "$ref": "#/definitions/primer_scheme_selection"
    },
    {
      "$ref": "#/definitions/output"
    },
    {
      "$ref": "#/definitions/squirrel_options"
    },
    {
      "$ref": "#/definitions/resource_options"
    },
    {
      "$ref": "#/definitions/advanced_options"
    },
    {
      "$ref": "#/definitions/misc"
    }
  ],
  "properties": {
    "aws_image_prefix": {
      "type": "string",
      "hidden": true
    },
    "aws_queue": {
      "type": "string",
      "hidden": true
    },
    "show_hidden_params": {
      "type": "boolean"
    }
  },
  "resources": {
    "recommended": {
      "cpus": 4,
      "memory": "8GB"
    },
    "minimum": {
      "cpus": 2,
      "memory": "4GB"
    },
    "run_time": "5 minutes per sample",
    "arm_support": false
  }
}