Skip to content
Snippets Groups Projects
Commit c2b05eaa authored by Jonathan Gesell's avatar Jonathan Gesell
Browse files

Updated for concise output files

parent 9c845c6e
Branches
Tags
3 merge requests!37v0.0.1,!4Develop,!2Resolve "process_getData"
#!/usr/bin/env nextflow #!/usr/bin/env nextflow
// Define input variables // Define input variables
params.deriva = "${baseDir}/../test_data/deriva-cookies.txt" params.deriva = "/project/BICF/BICF_Core/shared/gudmap/cookies/deriva-cookies.txt"
params.bdbag = "${baseDir}/../test_data/Study_Q-Y4H0.zip" params.bdbag = "${baseDir}/../test_data/Study_Q-Y4H0.zip"
params.outDir = "${baseDir}/../output" params.outDir = "${baseDir}/../output"
// Parse input variables // Parse input variables
deriva = file(params.deriva) deriva = file(params.deriva, checkIfExists: 'true')
bdbag = Channel bdbag = Channel
.fromPath(params.bdbag) .fromPath(params.bdbag)
.ifEmpty { exit 1, "bdbag zip file not found: ${params.bdbag}" } .ifEmpty { exit 1, "bdbag zip file not found: ${params.bdbag}" }
...@@ -19,10 +19,10 @@ outDir = params.outDir ...@@ -19,10 +19,10 @@ outDir = params.outDir
*/ */
process splitData { process splitData {
tag "${bdbag.baseName}" tag "${bdbag.baseName}"
publishDir "${outDir}/temp/${task.process}", mode: "symlink"
input: input:
file bdbag file bdbag
path cookies, stageAs: 'cookies.txt' from deriva
output: output:
file("Replicate_*.zip") into bdbagSplit mode flatten file("Replicate_*.zip") into bdbagSplit mode flatten
...@@ -34,48 +34,44 @@ process splitData { ...@@ -34,48 +34,44 @@ process splitData {
""" """
hostname hostname
ulimit -a ulimit -a
ln -sf `readlink -e ${deriva}` ~/.bdbag/deriva-cookies.txt ln -sf `readlink -e cookies.txt` ~/.bdbag/deriva-cookies.txt
echo LOG: deriva cookie linked echo "LOG: deriva cookie linked"
study=`echo "${bdbag}" | cut -d'.' -f1` study=`echo "${bdbag}" | cut -d '.' -f1`
echo LOG: \${study} echo "LOG: \${study}"
unzip ${bdbag} unzip ${bdbag}
echo LOG: bdgag unzipped echo "LOG: bdgag unzipped"
python3 ${baseDir}/scripts/modifyFetch.py --fetchFile \${study} python3 ${baseDir}/scripts/modifyFetch.py --fetchFile \${study}
echo LOG: fetch file filtered for only .fastq.gz echo "LOG: fetch file filtered for only .fastq.gz"
python3 ${baseDir}/scripts/splitFetch.py --fetchFile \${study} python3 ${baseDir}/scripts/splitFetch.py --fetchFile \${study}
echo LOG: fetch file split by replicates echo "LOG: fetch file split by replicates"
sh ${baseDir}/scripts/splitBag.sh \${study} sh ${baseDir}/scripts/splitBag.sh \${study}
echo LOG: bag recreated with replicate split fetch file echo "LOG: bag recreated with replicate split fetch file"
""" """
} }
println {${http_proxy}}
println {${https_proxy}}
/* /*
* getData: fetch study files from consortium with downloaded bdbag.zip * getData: fetch study files from consortium with downloaded bdbag.zip
*/ */
process getData { process getData {
tag "${rep.baseName}" tag "${rep.baseName}"
publishDir "${outDir}/temp/${task.process}", mode: "symlink" publishDir "${outDir}/tempOut/fastqs", mode: "symlink"
input: input:
each rep from bdbagSplit each rep from bdbagSplit
output: output:
file("**/*.R*.fastq.gz") into fastq path ("*.R*.fastq.gz", type: 'file', maxDepth: '0') into fastq
script: script:
""" """
hostname hostname
ulimit -a ulimit -a
echo LOG:\${http_proxy}
export https_proxy=\${http_proxy} export https_proxy=\${http_proxy}
replicate=\$(echo "${rep}" | cut -d'.' -f1 | rev | cut -f1 -d '/' | rev) replicate=\$(basename "${rep}" | cut -d '.' -f1)
echo LOG: \${replicate} echo "LOG: \${replicate}"
unzip ${rep} unzip ${rep}
echo LOG: replicate bdbag unzipped echo "LOG: replicate bdbag unzipped"
sh ${baseDir}/scripts/bdbagFetch.sh \${replicate} sh ${baseDir}/scripts/bdbagFetch.sh \${replicate}
echo LOG: replicate bdbag fetched echo "LOG: replicate bdbag fetched"
""" """
} }
#!/bin #!/bin/bash
bdbag --resolve-fetch all --fetch-filter filename\$*fastq.gz $1 bdbag --resolve-fetch all --fetch-filter filename\$*fastq.gz $1 &&
\ No newline at end of file for i in $(find */ -name "*.R*.fastq.gz"); do
mv ${i} .;
done;
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment