Skip to content
Snippets Groups Projects
Commit 00ee468b authored by Gervaise Henry's avatar Gervaise Henry :cowboy:
Browse files

Pass raw ends

parent 1f7ba7d5
Branches
Tags
2 merge requests!58Develop,!56Resolve "Detect error in inferMetadata for tracking"
Pipeline #8815 failed with stages
in 2 minutes and 30 seconds
...@@ -107,13 +107,14 @@ parseMetadata: ...@@ -107,13 +107,14 @@ parseMetadata:
- rep=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p repRID) - rep=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p repRID)
- exp=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p expRID) - exp=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p expRID)
- study=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p studyRID) - study=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p studyRID)
- endsMeta=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p endsMeta) - endsRaw=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p endsMeta)
- endsMeta="uk"
- endsManual=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p endsManual) - endsManual=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p endsManual)
- stranded=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p stranded) - stranded=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p stranded)
- spike=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p spike) - spike=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p spike)
- species=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p species) - species=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p species)
- readLength=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p readLength) - readLength=$(singularity run 'docker://gudmaprbk/python3:1.0.0' python3 ./workflow/scripts/parse_meta.py -r Replicate_RID -m "./test_data/meta/metaTest.csv" -p readLength)
- echo -e "${endsMeta},${endsManual},${stranded},${spike},${species},${readLength},${exp},${study},${rep}" > design.csv - echo -e "${endsMeta},${endsRaw},${endsManual},${stranded},${spike},${species},${readLength},${exp},${study},${rep}" > design.csv
- pytest -m parseMetadata - pytest -m parseMetadata
artifacts: artifacts:
name: "$CI_JOB_NAME" name: "$CI_JOB_NAME"
......
...@@ -310,8 +310,21 @@ process parseMetadata { ...@@ -310,8 +310,21 @@ process parseMetadata {
echo -e "LOG: study RID metadata parsed: \${study}" >> ${repRID}.parseMetadata.log echo -e "LOG: study RID metadata parsed: \${study}" >> ${repRID}.parseMetadata.log
# get endedness metadata # get endedness metadata
endsMeta=\$(python3 ${script_parseMeta} -r ${repRID} -m "${experimentSettings}" -p endsMeta) endsRaw=\$(python3 ${script_parseMeta} -r ${repRID} -m "${experimentSettings}" -p endsMeta)
echo -e "LOG: endedness metadata parsed: \${endsMeta}" >> ${repRID}.parseMetadata.log echo -e "LOG: endedness metadata parsed: \${endsRaw}" >> ${repRID}.parseMetadata.log
if [ "\${endsRaw}" == "Single Read" ]
then
endsMeta="se"
elif [ "\${endsRaw}" == "Paired End" ]
then
endsMeta="pe"
else
endsMeta="unknown"
fi
if [ "\${endsRaw}" == "" ]
then
endsRaw="_No value_"
fi
# ganually get endness # ganually get endness
endsManual=\$(python3 ${script_parseMeta} -r ${repRID} -m "${file}" -p endsManual) endsManual=\$(python3 ${script_parseMeta} -r ${repRID} -m "${file}" -p endsManual)
...@@ -344,18 +357,18 @@ process parseMetadata { ...@@ -344,18 +357,18 @@ process parseMetadata {
then then
fastqCountError=true fastqCountError=true
fastqCountError_details="Too many fastqs detected (>2)" fastqCountError_details="Too many fastqs detected (>2)"
elif [ "\${endsMeta}"" == "Single Read" ] && [ "${fastqCount}" -ne "1" ] elif [ "\${endsMeta}"" == "se" ] && [ "${fastqCount}" -ne "1" ]
then then
fastqCountError=true fastqCountError=true
fastqCountError_details="Number of fastqs detected does not match submitted endness" fastqCountError_details="Number of fastqs detected does not match submitted endness"
elif [ "\${endsMeta}"" == "Paired End" ] && [ "${fastqCount}" -ne "2" ] elif [ "\${endsMeta}"" == "pe" ] && [ "${fastqCount}" -ne "2" ]
then then
fastqCountError=true fastqCountError=true
fastqCountError_details="Number of fastqs detected does not match submitted endness" fastqCountError_details="Number of fastqs detected does not match submitted endness"
fi fi
# save design file # save design file
echo -e "\${endsMeta},\${endsManual},\${stranded},\${spike},\${species},\${readLength},\${exp},\${study}" > design.csv echo -e "\${endsMeta},\${endsRaw},\${endsManual},\${stranded},\${strandedRaw},\${spike},\${species},\${readLength},\${exp},\${study}" > design.csv
# save fastq count error file # save fastq count error file
echo -e "\${fastqCountError},\${fastqCountError_details}" > fastqCountError.csv echo -e "\${fastqCountError},\${fastqCountError_details}" > fastqCountError.csv
...@@ -364,6 +377,7 @@ process parseMetadata { ...@@ -364,6 +377,7 @@ process parseMetadata {
// Split metadata into separate channels // Split metadata into separate channels
endsMeta = Channel.create() endsMeta = Channel.create()
endsRaw = Channel.create()
endsManual = Channel.create() endsManual = Channel.create()
strandedMeta = Channel.create() strandedMeta = Channel.create()
spikeMeta = Channel.create() spikeMeta = Channel.create()
...@@ -373,6 +387,7 @@ expRID = Channel.create() ...@@ -373,6 +387,7 @@ expRID = Channel.create()
studyRID = Channel.create() studyRID = Channel.create()
metadata_fl.splitCsv(sep: ",", header: false).separate( metadata_fl.splitCsv(sep: ",", header: false).separate(
endsMeta, endsMeta,
endsRaw,
endsManual, endsManual,
strandedMeta, strandedMeta,
spikeMeta, spikeMeta,
...@@ -1939,6 +1954,7 @@ process failExecutionRun { ...@@ -1939,6 +1954,7 @@ process failExecutionRun {
val executionRunRID from executionRunRID_failExecutionRun val executionRunRID from executionRunRID_failExecutionRun
val inputBagRID from inputBagRID_failExecutionRun val inputBagRID from inputBagRID_failExecutionRun
val endsMeta from endsMeta_failExecutionRun val endsMeta from endsMeta_failExecutionRun
val endsRaw
val strandedMeta from strandedMeta_failExecutionRun val strandedMeta from strandedMeta_failExecutionRun
val spikeMeta from spikeMeta_failExecutionRun val spikeMeta from spikeMeta_failExecutionRun
val speciesMeta from speciesMeta_failExecutionRun val speciesMeta from speciesMeta_failExecutionRun
...@@ -1985,15 +2001,6 @@ process failExecutionRun { ...@@ -1985,15 +2001,6 @@ process failExecutionRun {
pipelineError_details=\$(echo \${pipelineError_details}"|:-:|-:|-:|\\n") pipelineError_details=\$(echo \${pipelineError_details}"|:-:|-:|-:|\\n")
if ${pipelineError_ends} if ${pipelineError_ends}
then then
if [ "${endsMeta}" == "se" ]
then
endMeta="Single End"
elif [ "${endsMeta}" == "pe" ]
then
endMeta="Paired End"
else
endMeta="unknown"
fi
if [ "${endsInfer}" == "se" ] if [ "${endsInfer}" == "se" ]
then then
endInfer="Single End" endInfer="Single End"
...@@ -2003,7 +2010,7 @@ process failExecutionRun { ...@@ -2003,7 +2010,7 @@ process failExecutionRun {
else else
endInfer="unknown" endInfer="unknown"
fi fi
pipelineError_details=\$(echo \${pipelineError_details}"|Paired End|"\${endMeta}"|"\${endInfer}"|\\n") pipelineError_details=\$(echo \${pipelineError_details}"|Paired End|${endsRaw}|"\${endInfer}"|\\n")
fi fi
if ${pipelineError_stranded} if ${pipelineError_stranded}
then then
......
...@@ -62,12 +62,7 @@ def main(): ...@@ -62,12 +62,7 @@ def main():
# Get endedness metadata from 'Experiment Settings.csv' # Get endedness metadata from 'Experiment Settings.csv'
if (args.parameter == "endsMeta"): if (args.parameter == "endsMeta"):
if (metaFile.Paired_End.unique() == "Single End"): endsMeta = metaFile.Paired_End.unique()
endsMeta = "se"
elif (metaFile.Paired_End.unique() == "Paired End"):
endsMeta = "pe"
else:
endsMeta = "uk"
print(endsMeta) print(endsMeta)
# Manually get endness count from 'File.csv' # Manually get endness count from 'File.csv'
......
...@@ -19,7 +19,7 @@ def readLine(fileName): ...@@ -19,7 +19,7 @@ def readLine(fileName):
data = False data = False
file = open(fileName, "r") file = open(fileName, "r")
line = file.readline() line = file.readline()
if line.strip() == "uk,se,unstranded,no,Homo sapiens,75,Experiment_RID,Study_RID,Replicate_RID": if line.strip() == "uk,uk,se,unstranded,no,Homo sapiens,75,Experiment_RID,Study_RID,Replicate_RID":
data = True data = True
return data return data
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment