Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
RNA-seq
Manage
Activity
Members
Labels
Plan
Issues
12
Issue boards
Milestones
Iterations
Wiki
Requirements
Code
Merge requests
0
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Locked files
Build
Pipelines
Jobs
Pipeline schedules
Test cases
Artifacts
Deploy
Releases
Container Registry
Operate
Environments
Monitor
Incidents
Service Desk
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Code review analytics
Issue analytics
Insights
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
GUDMAP_RBK
RNA-seq
Commits
d1271604
There was an error fetching the commit references. Please try again later.
Commit
d1271604
authored
4 years ago
by
Gervaise Henry
🤠
Browse files
Options
Downloads
Patches
Plain Diff
Add seqwho infer QC table to multiqc
parent
d9be943e
2 merge requests
!76
Develop
,
!71
Seqwho
Pipeline
#9318
failed with stages
in 3 minutes and 20 seconds
Changes
2
Pipelines
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
rna-seq.nf
+17
-5
17 additions, 5 deletions
rna-seq.nf
workflow/conf/multiqc_config.yaml
+28
-2
28 additions, 2 deletions
workflow/conf/multiqc_config.yaml
with
45 additions
and
7 deletions
rna-seq.nf
+
17
−
5
View file @
d1271604
...
...
@@ -683,6 +683,7 @@ process seqwho {
val fastqReadError from fastqReadError_seqwho
output:
path "seqwhoInfer.tsv" into seqwhoInfer
path "inferSpecies.csv" into inferSpecies_fl
path "inferError.csv" into inferError_fl
...
...
@@ -828,6 +829,7 @@ process seqwho {
seqtypeError_details="**Infered sequencing type does not match for R1 and R2:** Infered R1 = \${seqtypeR1} and infered R2 = \${seqtypeR2}"
echo -e "LOG: inference error: \${seqtypeError_details}" >> ${repRID}.seqwho.log
fi
consensus="-"
else
echo -e "LOG: low confidence seq type inference detected" >> ${repRID}.seqwho.log
seqtk sample -s100 ${fastq[0]} 1000000 1> sampled.1.seed100.fastq &
...
...
@@ -845,9 +847,9 @@ process seqwho {
cp SeqWho_call.tsv SeqWho_call_sampledR1.tsv
if [ "\${seqtypeR1_1}" == "\${seqtypeR1}" ] && [ "\${seqtypeR1_2}" == "\${seqtypeR1}" ] && [ "\${seqtypeR1_3}" == "\${seqtypeR1}" ]
then
con
c
ensus=true
con
s
ensus=true
else
con
c
ensus=false
con
s
ensus=false
fi
if [ "${ends}" == "pe" ]
then
...
...
@@ -866,12 +868,12 @@ process seqwho {
cp SeqWho_call.tsv SeqWho_call_sampledR2.tsv
if [ "\${seqtypeR2_1}" == "\${seqtypeR1}" ] && [ "\${seqtypeR2_2}" == "\${seqtypeR1}" ] && [ "\${seqtypeR2_3}" == "\${seqtypeR1}" ]
then
con
c
ensus=\${con
c
ensus}
con
s
ensus=\${con
s
ensus}
else
con
c
ensus=false
con
s
ensus=false
fi
fi
if [ \${con
c
ensus} == false ]
if [ \${con
s
ensus} == false ]
then
seqtypeError=true
seqtypeError_details=\$(echo "**Infered species confidence is low:**\\n")
...
...
@@ -901,7 +903,16 @@ process seqwho {
speciesError=false
echo -e "LOG: species matches: Submitted=${speciesMeta}; Inferred=\${speciesInfer}" >> ${repRID}.seqwho.log
fi
# save seqwho multiqc report
echo -e "Read\tSeq Type\tSpecies\tConfidence\tSeq Type Confidence\tSeq Type Consensus\tSpecies Confidence" > seqwhoInfer.tsv
echo -e "Read 1\y\${seqtypeR1}\t\${speciesR1}\t\${confidenceR1}\${seqtypeConfidenceR1}\t\${consensus}\t\${speciesConfidenceR1}" >> seqwhoInfer.tsv
if [ "${ends}" == "pe" ]
then
echo -e "Read 2\y\${seqtypeR2}\t\${speciesR2}\t\${confidenceR2}\${seqtypeConfidenceR2}\t\${consensus}\t\${speciesConfidenceR2}" >> seqwhoInfer.tsv
fi
# save species file
echo "\${speciesInfer}" > inferSpecies.csv
...
...
@@ -2008,6 +2019,7 @@ process aggrQC {
input:
path multiqcConfig
path bicfLogo
path seqwhoInfer
path softwareReferences
path softwareVersions
path fastqc
...
...
This diff is collapsed.
Click to expand it.
workflow/conf/multiqc_config.yaml
+
28
−
2
View file @
d1271604
...
...
@@ -37,10 +37,10 @@ top_modules:
name
:
'
Count'
info
:
'
Replicate
Feature
Count
QC
Results'
-
hisat2
:
name
:
'
Inference:
Alig
n'
name
:
'
Inference:
Spike-i
n'
info
:
'
Inference
Alignment
(1M
downsampled
reads)
QC
Results'
path_filters
:
-
'
*
alignSampleSummary*'
-
'
ERCC.
alignSampleSummary*'
-
rseqc
:
name
:
'
Inference:
Stranded'
info
:
'
1M
Downsampled
Reads
Strandedness
Inference
Results'
...
...
@@ -166,6 +166,30 @@ custom_data:
71 -
80
81 -
90
91 -
100
seqwho
:
file_format
:
'
tsv'
section_name
:
'
Inference:
Sequencing
Type
&
Species'
description
:
'
This
is
the
inference
results
from
the
SeqWho
tool'
plot_type
:
'
table'
pconfig
:
id
:
'
ref'
scale
:
false
format
:
'
{}'
headers
:
Read
:
description
:
'
Sequencing
read
(R1/R2)'
Seq Type
:
description
:
'
Inferred
Sequence
Type'
Species
:
description
:
'
Inferred
Species'
Confidence
:
description
:
'
Call
confidence'
Seq Type Confidence
:
description
:
'
Seqence
type
call
confidence
(1=high,
0=low)'
Seq Type Consensus
:
description
:
'
Low
confidence
sequence
type
call
sampling
inference
consensus'
Species Confidence
:
description
:
'
Species
call
confidence
(1=high,
0=low)'
sp
:
run
:
...
...
@@ -178,3 +202,5 @@ sp:
fn
:
'
reference.tsv'
tin
:
fn
:
'
*_tin.hist.tsv'
seqwho
:
fn
:
'
seqwhoInfer.tsv'
This diff is collapsed.
Click to expand it.
Preview
0%
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment