From 172d32129f0fc9214b3eafcd28e23be2d1095772 Mon Sep 17 00:00:00 2001
From: "Gervaise H. Henry" <gervaise.henry@utsouthwestern.edu>
Date: Mon, 3 Aug 2020 15:41:02 -0500
Subject: [PATCH] Nextflow-ify bash command to extract median read length

---
 workflow/rna-seq.nf | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/workflow/rna-seq.nf b/workflow/rna-seq.nf
index 50e2aef..e155a94 100644
--- a/workflow/rna-seq.nf
+++ b/workflow/rna-seq.nf
@@ -299,11 +299,11 @@ process trimData {
     if [ "${ends}" == "se" ]
     then
       trim_galore --gzip -q 25 --illumina --length 35 --basename ${repRID} -j `nproc` ${fastq[0]}
-      readLength=\$(zcat *_trimmed.fq.gz | awk '{if(NR%4==2) print length(\${1})}' | sort -n | awk '{a[NR]=$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
+      readLength=\$(zcat *_trimmed.fq.gz | awk '\{if(NR%4==2) print length(\${1})}' | sort -n | awk '\{a[NR]=$0}END\{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
     elif [ "${ends}" == "pe" ]
     then
       trim_galore --gzip -q 25 --illumina --length 35 --paired --basename ${repRID} -j `nproc` ${fastq[0]} ${fastq[1]}
-      readLength=\$(zcat *_1.fq.gz | awk '{if(NR%4==2) print length(\${1})}' | sort -n | awk '{a[NR]=$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
+      readLength=\$(zcat *_1.fq.gz | awk '\{if(NR%4==2) print length(\${1})}' | sort -n | awk '\{a[NR]=$0}END\{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
     fi
     echo -e "LOG: trimmed" >> ${repRID}.trimData.log
     echo -e "LOG: average trimmed read length: /${readLength}" >> ${repRID}.trimData.log
-- 
GitLab