genomic-medicine-sweden · jemten · Oct 31, 2023 · Oct 30, 2023 · ramprasadn · Oct 31, 2023
@@ -28,9 +28,13 @@ workflow ALIGNMENT {
     main:
         ch_versions = Channel.empty()
 
-        CAT_FASTQ(reads)
+        ch_fastq = branchFastqToSingleAndMulti(reads)
 
-        FASTP(CAT_FASTQ.out.reads,[],false,false)
+        CAT_FASTQ(ch_fastq.multiple_fq)
+        .reads.mix(ch_fastq.single_fq)
+        .set { ch_cat_fastq }
+
+        FASTP(ch_cat_fastq, [], false, false)
 
         STAR_ALIGN(FASTP.out.reads, star_index, gtf, false, 'illumina', false)
 
@@ -86,3 +90,32 @@ workflow ALIGNMENT {
         salmon_info     = SALMON_QUANT.out.json_info
         versions        = ch_versions
 }
+
+
+// Custom functions
+
+/**
+* Branch the read channel into different channels,
+* depending on whether the sample has multiple fastq files or not.
+* The resulting channels get the original sample id in meta.
+*
+* The original id is recovered by dropping everything from the last '_T'
+* in meta.id onwards. An id that contains no '_T' is kept unchanged.
+* Entries are then grouped on the updated meta, so all fastq entries that
+* share the same meta end up in a single item.
+*
+* @param ch_reads Channel containing meta and fastq reads
+* @return Channel containing meta with original id and branched on number of fastq files.
+*         Output 'single_fq' holds items with exactly one grouped fastq entry,
+*         output 'multiple_fq' holds items with more than one. In both outputs
+*         the grouped fastq entries are flattened into a single list.
+*/
+def branchFastqToSingleAndMulti(ch_reads) {
+
+    return ch_reads
+        .map {
+            meta, fastq ->
+                // 'def' keeps these variables local to each closure invocation;
+                // without it they would be shared script-level variables.
+                def sample_id    = meta.id.toString()
+                // Cut at the LAST '_T' so that ids containing '_T' elsewhere
+                // are not altered.
+                def suffix_start = sample_id.lastIndexOf('_T')
+                def original_id  = suffix_start >= 0 ? sample_id.substring(0, suffix_start) : sample_id
+                [ meta + [id: original_id], fastq ]
+        }
+        .groupTuple()
+        .branch {
+            meta, fastq ->
+                // After groupTuple, 'fastq' is a list with one element per grouped entry.
+                single_fq: fastq.size() == 1
+                    return [ meta, fastq.flatten() ]
+                multiple_fq: fastq.size() > 1
+                    return [ meta, fastq.flatten() ]
+        }
+}
         In addition to the validation, also rename all samples to have a suffix of _T{n}, where n is the 
         In addition to the validation, also rename all samples to have a suffix of _T{n}, where n is the