From 38d411ee1b85455d31fb8cfd96d94e7b2771ee5f Mon Sep 17 00:00:00 2001
From: "Gervaise H. Henry" <gervaise.henry@utsouthwestern.edu>
Date: Mon, 3 Aug 2020 15:37:38 -0500
Subject: [PATCH] Nextflow-ify bash command to extract median read length

---
Review notes (this area is ignored by `git am`):
  * Inside the Nextflow script string, every shell/awk dollar sign must be
    escaped so that it survives Groovy interpolation. The awk field references
    are therefore written `\$1` and `\$0`. The earlier `\${1}` reaches awk as
    `${1}`, which is not valid awk, and a bare `$0` is rejected by Groovy.
  * The last context line still contains `/${readLength}`; this looks like a
    typo for `\${readLength}` -- confirm and fix in a follow-up change.
  * Leading whitespace in the hunk was reconstructed; if it does not match the
    target file, apply with `git apply --ignore-whitespace`. The post-image
    blob id on the `index` line predates the amended `+` lines.

 workflow/rna-seq.nf | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/workflow/rna-seq.nf b/workflow/rna-seq.nf
index ee012c2..50e2aef 100644
--- a/workflow/rna-seq.nf
+++ b/workflow/rna-seq.nf
@@ -299,11 +299,11 @@ process trimData {
     if [ "${ends}" == "se" ]
     then
       trim_galore --gzip -q 25 --illumina --length 35 --basename ${repRID} -j `nproc` ${fastq[0]}
-      readLength=$(zcat *_trimmed.fq.gz | awk '{if(NR%4==2) print length($1)}' | sort -n | awk '{a[NR]=$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
+      readLength=\$(zcat *_trimmed.fq.gz | awk '{if(NR%4==2) print length(\$1)}' | sort -n | awk '{a[NR]=\$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
     elif [ "${ends}" == "pe" ]
     then
       trim_galore --gzip -q 25 --illumina --length 35 --paired --basename ${repRID} -j `nproc` ${fastq[0]} ${fastq[1]}
-      readLength=$(zcat *_1.fq.gz | awk '{if(NR%4==2) print length($1)}' | sort -n | awk '{a[NR]=$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
+      readLength=\$(zcat *_1.fq.gz | awk '{if(NR%4==2) print length(\$1)}' | sort -n | awk '{a[NR]=\$0}END{print(NR%2==1)?a[int(NR/2)+1]:(a[NR/2]+a[NR/2+1])/2}')
     fi
     echo -e "LOG: trimmed" >> ${repRID}.trimData.log
     echo -e "LOG: average trimmed read length: /${readLength}" >> ${repRID}.trimData.log
-- 
GitLab