From d9895270df438051129f9572eef17c85c47e98f9 Mon Sep 17 00:00:00 2001 From: s181706 <jonathan.gesell@utsouthwestern.edu> Date: Wed, 12 Feb 2020 12:06:22 -0600 Subject: [PATCH] Updated to include reference selection --- workflow/conf/biohpc.config | 4 ++-- workflow/rna-seq.nf | 48 ++++++++++++++++++++++++++----------- 2 files changed, 36 insertions(+), 16 deletions(-) diff --git a/workflow/conf/biohpc.config b/workflow/conf/biohpc.config index 56e7e6a..88787a7 100755 --- a/workflow/conf/biohpc.config +++ b/workflow/conf/biohpc.config @@ -16,13 +16,13 @@ process { executor = 'local' } withName:trimData { - queue = 'super' + queue = '128GB,256GB,256GBv1' } withName:alignData { queue = '256GB,256GBv1' } withName: dedupData { - queue = 'super' + queue = '128GB,256GB,256GBv1' } withName: fastqc { queue = 'super' diff --git a/workflow/rna-seq.nf b/workflow/rna-seq.nf index 98b05ad..28770ca 100755 --- a/workflow/rna-seq.nf +++ b/workflow/rna-seq.nf @@ -1,12 +1,19 @@ #!/usr/bin/env nextflow +// ######## #### ###### ######## +// ## ## ## ## ## ## +// ## ## ## ## ## +// ######## ## ## ###### +// ## ## ## ## ## +// ## ## ## ## ## ## +// ######## #### ###### ## + // Define input variables params.deriva = "${baseDir}/../test_data/auth/credential.json" params.bdbag = "${baseDir}/../test_data/auth/cookies.txt" //params.repRID = "16-1ZX4" params.repRID = "Q-Y5JA" -params.refVersion = "0.0.1" -params.refMuVersion = "38.P6.vM22" +params.refMoVersion = "38.p6.vM22" params.refHuVersion = "38.p12.v31" params.outDir = "${baseDir}/../output" @@ -18,15 +25,15 @@ bdbag = Channel .fromPath(params.bdbag) .ifEmpty { exit 1, "deriva cookie file for bdbag not found: ${params.bdbag}" } repRID = params.repRID -refVersion = params.refVersion -refMuVersion = params.refMuVersion +refMoVersion = params.refMoVersion refHuVersion = params.refHuVersion outDir = params.outDir logsDir = "${outDir}/Logs" // Define fixed files derivaConfig = Channel.fromPath("${baseDir}/conf/replicate_export_config.json") -referenceBase = "s3://bicf-references" +//referenceBase = "s3://bicf-references" +referenceBase = "/project/BICF/BICF_Core/shared/gudmap/references" // Define script files script_bdbagFetch = Channel.fromPath("${baseDir}/scripts/bdbagFetch.sh") @@ -186,9 +193,11 @@ stranded.into { } spike.into{ spike_getRef + spike_rseqc } species.into { species_getRef + species_rseqc } /* @@ -199,10 +208,6 @@ process getRef { publishDir "${logsDir}", mode: "copy", pattern: "*.getRef.err" input: - val referenceBase - val refVersion - val refMuVersion - val refHuVersion val spike_getRef val species_getRef @@ -215,13 +220,13 @@ process getRef { ulimit -a >>${repRID}.getRef.err export https_proxy=\${http_proxy} - # retreive appropriate reference from S3 bucket + # run set the reference name if [ "${species_getRef}" == "Mus musculus" ] then - references=\$(echo ${referenceBase}/mouse/${refVersion}/GRCm${refMuVersion}) + references=\$(echo ${referenceBase}/GRCm${refMoVersion}) elif [ '${species_getRef}' == "Homo sapiens" ] then - references=\$(echo ${referenceBase}/human/${refVersion}/GRCh${refHuVersion}) + references=\$(echo ${referenceBase}/GRCh${refHuVersion}) else exit 1 fi @@ -232,7 +237,17 @@ process getRef { then reference=\$(echo \${references}/) fi - aws s3 cp "\${references}" ./ --recursive >>${repRID}.getRef.err + + # retreive appropriate reference appropriate location + if [ ${referenceBase} == "s3://bicf-references" ] + then + aws s3 cp "\${references}" /hisat2 ./ --recursive >>${repRID}.getRef.err + aws s3 cp "\${references}" /bed ./ --recursive >>${repRID}.getRef.err + elif [ ${referenceBase} == "/project/BICF/BICF_Core/shared/gudmap/references" ] + then + cp -R "\${references}"/hisat2 ./ >>${repRID}.getRef.err + cp -R "\${references}"/bed ./ >>${repRID}.getRef.err + fi """ } @@ -268,6 +283,11 @@ process trimData { """ } +reference.into { + reference_alignData + reference_rseqc +} + /* * alignData: aligns the reads to a reference database */ @@ -279,7 +299,7 @@ process alignData { val endsManual_alignData val stranded_alignData path fastq from fastqs_trimmed - path reference + path reference_alignData output: path ("${repRID}.sorted.bam") into rawBam -- GitLab