Skip to content

Commit 7218c1c

Browse files
authored
Merge pull request #11 from ikmb/devel
Release 1.2 with cleaned up modules and version reporting
2 parents 0bb9136 + 320ad2b commit 7218c1c

34 files changed

+609
-333
lines changed

README.md

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,15 @@
22

33
# IKMB HLA pipeline
44

5-
This pipeline performs HLA typing from short read NGS data.
5+
This pipeline performs HLA typing from short read NGS data. Several tools are supported:
6+
7+
* [xHLA](https://github.com/humanlongevity/HLA) (xhla)
8+
* [Hisat-genotype](https://daehwankimlab.github.io/hisat-genotype/) (hisat) Slow on anything other than targeted sequencing!
9+
* [Optitype](https://github.com/FRED-2/OptiType) (optitype)
10+
* [HLAscan](https://github.com/SyntekabioTools/HLAscan) (hlascan)
11+
* [HLA-HD](https://www.genome.med.kyoto-u.ac.jp/HLA-HD/) (hlahd)
12+
13+
For usage instructions, please see below.
614

715
## Documentation
816

bin/gendx_parser.rb

Lines changed: 8 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -113,7 +113,7 @@ def hisat_reconcile(list)
113113

114114
# FIND MATCHING JSON FILE
115115
json = jsons.find{|j| j.include?(sample) }
116-
abort "Could not find matching json file (#{sample}) under provided path!"
116+
abort "Could not find matching json file (#{sample}) under the path provided!"
117117

118118
# Build a HASH per gene, for each calling approach - starting with GenDX
119119
if json
@@ -213,6 +213,13 @@ def hisat_reconcile(list)
213213
if tool == "Hisat"
214214
tcalls = hisat_reconcile(tcalls)
215215
end
216+
217+
tcalls = tcalls.select {|tc| tc.length > 1 }
218+
219+
# if only one call exists, we assume it is homozygous and we double it.
220+
if tcalls.length == 1
221+
tcalls << tcalls[0]
222+
end
216223

217224
tcalls.sort[0..1].each_with_index do |t,i|
218225

bin/report.rb

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -248,7 +248,7 @@
248248
r = [ k ]
249249
this_result = [ k ]
250250
rheader[1..-1].each do |h|
251-
this_result << alleles[k][h].sort.join("\n")
251+
this_result << alleles[k][h].sort.map {|a| a.split("*")[-1]}.join("\n")
252252
end
253253
results << this_result
254254
end

conf/base.config

Lines changed: 26 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -18,51 +18,40 @@ process {
1818

1919
// software dependencies moved to conda.config
2020

21-
withName:FASTP {
22-
cpus = 4
23-
}
24-
withName: HISAT_GENOTYPE {
25-
time = { check_max( 12.h * task.attempt, 'time' ) }
26-
memory = { check_max( 64.GB * task.attempt, 'memory' ) }
27-
cpus = params.max_cpus/2
28-
}
29-
30-
withName: 'DEDUP|BAM2FASTQ|BEDCOV' {
31-
cpus = 8
32-
memory = { check_max( 8.GB * task.attempt, 'memory' ) }
33-
21+
withLabel: short_serial {
22+
time = { check_max( 4.h * task.attempt, 'time' ) }
23+
memory = { check_max( 8.GB * task.attempt, 'memory' ) }
3424
}
35-
withName: 'XHLA' {
36-
memory = { check_max( 32.GB * task.attempt, 'memory' ) }
25+
withLabel: medium_serial {
26+
time = { check_max( 8.h * task.attempt, 'time' ) }
27+
memory = { check_max( 8.GB * task.attempt, 'memory' ) }
3728
}
38-
39-
withName: 'HLASCAN' {
40-
cpus = 4
41-
memory = { check_max( 32.GB * task.attempt, 'memory' ) }
29+
withLabel: long_serial {
30+
time = { check_max( 12.h * task.attempt, 'time' ) }
31+
memory = { check_max( 16.GB * task.attempt, 'memory' ) }
4232
}
43-
44-
withName: 'BWA' {
45-
time = { check_max( 12.h * task.attempt, 'time' ) }
46-
memory = { check_max( 64.GB * task.attempt, 'memory' ) }
47-
cpus = { check_max( 12 * task.attempt, 'cpus' ) }
33+
withLabel: short_parallel {
34+
time = { check_max( 4.h * task.attempt, 'time' ) }
35+
memory = { check_max( 16.GB * task.attempt, 'memory' ) }
36+
cpus = { check_max( 4 * task.attempt, 'cpus' ) }
4837
}
49-
50-
withLabel: 'optitype' {
51-
container = "docker://quay.io/biocontainers/optitype:1.3.5--hdfd78af_1"
38+
withLabel: medium_parallel {
39+
time = { check_max( 8.h * task.attempt, 'time' ) }
40+
memory = { check_max( 24.GB * task.attempt, 'memory' ) }
41+
cpus = { check_max( 8 * task.attempt, 'cpus' ) }
5242
}
53-
54-
withName: 'OPTITYPE_FILTER' {
55-
time = { check_max( 12.h * task.attempt, 'time' ) }
56-
memory = { check_max( 64.GB * task.attempt, 'memory' ) }
57-
cpus = { check_max( 10 * task.attempt, 'cpus' ) }
43+
withLabel: long_parallel {
44+
time = { check_max( 24.h * task.attempt, 'time' ) }
45+
memory = { check_max( 24.GB * task.attempt, 'memory' ) }
46+
cpus = { check_max( 8 * task.attempt, 'cpus' ) }
5847
}
59-
withName: 'OPTITYPE_RUN' {
60-
time = { check_max( 4.h * task.attempt, 'time' ) }
61-
memory = { check_max( 32.GB * task.attempt, 'memory' ) }
62-
cpus = 12
48+
withLabel: extra_long_parallel {
49+
time = { check_max( 96.h * task.attempt, 'time' ) }
50+
memory = { check_max( 24.GB * task.attempt, 'memory' ) }
51+
cpus = { check_max( 8 * task.attempt, 'cpus' ) }
6352
}
6453

65-
54+
6655
}
6756

6857

main.nf

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ WorkflowHla.initialise( params, log)
2727

2828
params.fasta = file(params.genomes[ "hg38" ].fasta, checkIfExists: true)
2929
params.dict = file(params.genomes[ "hg38" ].dict, checkIfExists: true)
30+
params.fai = file(params.genomes[ "hg38" ].fasta + ".fai", checkIfExists: true)
3031

3132
include { HLA } from './workflows/hla'
3233

modules/bwa.nf

Lines changed: 0 additions & 29 deletions
This file was deleted.

modules/bwa/mem.nf

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
process BWA_MEM {
2+
3+
tag "${meta.patient_id}|${meta.sample_id}"
4+
5+
label 'medium_parallel'
6+
7+
input:
8+
tuple val(meta), path(left),path(right)
9+
val(bwa_index)
10+
11+
output:
12+
tuple val(meta), path(bam), emit: bam
13+
val(sample), emit: sample_name
14+
val(meta), emit: meta_data
15+
path("versions.yml"), emit: versions
16+
17+
script:
18+
bam = "${meta.sample_id}_${meta.library_id}_${meta.readgroup_id}_bwa-aligned_fm.bam"
19+
sample = "${meta.patient_id}_${meta.sample_id}"
20+
21+
"""
22+
bwa mem -H ${params.dict} -M -R "@RG\\tID:${meta.readgroup_id}\\tPL:ILLUMINA\\tPU:${meta.platform_unit}\\tSM:${meta.patient_id}_${meta.sample_id}\\tLB:${meta.library_id}\\tDS:${bwa_index}\\tCN:${meta.center}" \
23+
-t ${task.cpus} ${bwa_index} $left $right \
24+
| samtools fixmate -@ ${task.cpus} -m - - \
25+
| samtools sort -@ ${task.cpus} -m 4G -O bam -o $bam -
26+
27+
cat <<-END_VERSIONS > versions.yml
28+
"${task.process}":
29+
bwa: \$(echo \$(bwa 2>&1) | sed 's/^.*Version: //; s/Contact:.*\$//')
30+
samtools: \$(echo \$(samtools --version 2>&1) | sed 's/^.*samtools //; s/Using.*\$//')
31+
END_VERSIONS
32+
33+
"""
34+
}

modules/concat_fastq.nf

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,7 @@
11
process CONCAT_FASTQ {
22

3+
tag "${meta.sample_id}"
4+
35
//publishDir "${params.outdir}/GenDX", mode: 'copy'
46

57
input:
@@ -17,4 +19,4 @@ process CONCAT_FASTQ {
1719
zcat $r2 | gzip -c >> $r2_merged
1820
"""
1921

20-
}
22+
}
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
process CUSTOM_DUMPSOFTWAREVERSIONS {
2+
3+
label 'short_serial'
4+
5+
container 'quay.io/biocontainers/multiqc:1.11--pyhdfd78af_0'
6+
7+
input:
8+
path versions
9+
10+
output:
11+
path "software_versions.yml" , emit: yml
12+
path "software_versions_mqc.yml", emit: mqc_yml
13+
path "versions.yml" , emit: versions
14+
15+
script:
16+
template 'dumpsoftwareversions.py'
17+
18+
}
Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,34 @@
1+
name: custom_dumpsoftwareversions
2+
description: Custom module used to dump software versions within the nf-core pipeline template
3+
keywords:
4+
- custom
5+
- version
6+
tools:
7+
- custom:
8+
description: Custom module used to dump software versions within the nf-core pipeline template
9+
homepage: https://github.com/nf-core/tools
10+
documentation: https://github.com/nf-core/tools
11+
licence: ["MIT"]
12+
input:
13+
- versions:
14+
type: file
15+
description: YML file containing software versions
16+
pattern: "*.yml"
17+
18+
output:
19+
- yml:
20+
type: file
21+
description: Standard YML file containing software versions
22+
pattern: "software_versions.yml"
23+
- mqc_yml:
24+
type: file
25+
description: MultiQC custom content YML file containing software versions
26+
pattern: "software_versions_mqc.yml"
27+
- versions:
28+
type: file
29+
description: File containing software versions
30+
pattern: "versions.yml"
31+
32+
authors:
33+
- "@drpatelh"
34+
- "@grst"

0 commit comments

Comments
 (0)