From 97e72a8b200c9d04da19660e5607ca4aedb6e82c Mon Sep 17 00:00:00 2001
From: "Gervaise H. Henry" <gervaise.henry@utsouthwestern.edu>
Date: Mon, 3 Aug 2020 15:42:09 -0500
Subject: [PATCH] Nextflow-ify bash command to extract median read length

---
 workflow/rna-seq.nf | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/workflow/rna-seq.nf b/workflow/rna-seq.nf
index e155a94..3e7e3aa 100644
--- a/workflow/rna-seq.nf
+++ b/workflow/rna-seq.nf
@@ -299,14 +299,14 @@ process trimData {
     if [ "${ends}" == "se" ]
     then
       trim_galore --gzip -q 25 --illumina --length 35 --basename ${repRID} -j `nproc` ${fastq[0]}
-      readLength=\$(zcat *_trimmed.fq.gz | awk '\{if(NR%4==2) print length(\${1})}' | sort -n | awk '\{a[NR]=$0}END\{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
+      readLength=\$(zcat *_trimmed.fq.gz | awk '{if(NR%4==2) print length(\$1)}' | sort -n | awk '{a[NR]=\$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
     elif [ "${ends}" == "pe" ]
     then
       trim_galore --gzip -q 25 --illumina --length 35 --paired --basename ${repRID} -j `nproc` ${fastq[0]} ${fastq[1]}
-      readLength=\$(zcat *_1.fq.gz | awk '\{if(NR%4==2) print length(\${1})}' | sort -n | awk '\{a[NR]=$0}END\{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
+      readLength=\$(zcat *_1.fq.gz | awk '{if(NR%4==2) print length(\$1)}' | sort -n | awk '{a[NR]=\$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
     fi
     echo -e "LOG: trimmed" >> ${repRID}.trimData.log
-    echo -e "LOG: average trimmed read length: /${readLength}" >> ${repRID}.trimData.log
+    echo -e "LOG: average trimmed read length: \${readLength}" >> ${repRID}.trimData.log
     
     # save read length file
     echo -e "\${readLength}" > readLength.csv
-- 
GitLab