From e78c5af1c7d8601894bb63dfaba18f5a8561c2d7 Mon Sep 17 00:00:00 2001 From: Holly Ruess <holly.ruess@utsouthwestern.edu> Date: Fri, 18 Jan 2019 09:38:37 -0600 Subject: [PATCH] add Pearson Correlation, make plots pdf --- workflow/.DS_Store | Bin 0 -> 6148 bytes workflow/main.nf | 2 +- workflow/scripts/experiment_qc.py | 27 ++++++++++++++++++++++++--- workflow/tests/test_experiment_qc.py | 6 ++++-- 4 files changed, 29 insertions(+), 6 deletions(-) create mode 100644 workflow/.DS_Store diff --git a/workflow/.DS_Store b/workflow/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..1cfdf47763f95697736ca7303755f243846e9ca2 GIT binary patch literal 6148 zcmeHK&1%~~5T5l<ymlz{p->-n$;}75Y3)-$IPRghfI@O;N+Q*!5xA1E<e0>D(QCAC zlqcxx^qbwaY2xM<N-;Aq`;F#j#eQ0LHAJKa^HG<mNkkgTSgK?Ai*THEOG?gD1}Zbh zlyb_VMK+BlTiN3H9~t0pSEGzR(~M&J<NKu%BKOgB5@&g*^GlV=mFiwi>xOQ;XnYE; z(?yVn`8*qhvyc3A66V*Dvrp4>va!SHEFLc|o3D=3BoE_cJTt}dXpEGL^Eer$i$OY1 zMwyu>umP>>x_;SgEtkD_-M07kO>foqmi>MQ_F-?es_WMW-J=gzUvKZ0-&Ws$SZ)=z zp^=vk*YFd@qh;O%vt*JcUl8G{Dz@$zL|_9yimc}l6b6I=VPIz%aEGPd-<cK3LWBWf z;JFy!^TC5M`VI?==IFp+S^!`LZX>X{m*5)Dq3^J;hzLa4QlKqWuEkKc9DdK``3?(< zww#n}K9qa2avh2?Z^!(eNhjr7lu;NE1|BlNy&t5>_y7B+`+t)pgD@Zr>?Q-MG7N?T ztj*o6TdU-|)`MO_Svaq-xG8~Qu43f!RosFaf!|{T=sPSd!UK^X0Yiff!oWXe;5UU> BSiS%N literal 0 HcmV?d00001 diff --git a/workflow/main.nf b/workflow/main.nf index 29afb26..6c69eda 100644 --- a/workflow/main.nf +++ b/workflow/main.nf @@ -198,7 +198,7 @@ process experimentQC { output: - file '*.{png,npz}' into deepToolsStats + file '*.{pdf,npz}' into deepToolsStats script: diff --git a/workflow/scripts/experiment_qc.py b/workflow/scripts/experiment_qc.py index 7386fcf..affbbc4 100644 --- a/workflow/scripts/experiment_qc.py +++ b/workflow/scripts/experiment_qc.py @@ -76,10 +76,10 @@ def generate_read_summary(design, extension): return mbs_filename -def check_correlation(mbs): +def check_spearman_correlation(mbs): '''Check Spearman pairwise correlation of samples based on read counts.''' - spearman_filename = 'heatmap_SpearmanCorr.png' + spearman_filename = 'heatmap_SpearmanCorr.pdf' spearman_params = "--corMethod spearman --skipZero" + \ " --plotTitle \"Spearman Correlation of Read Counts\"" + \ " --whatToPlot heatmap --colorMap RdYlBu --plotNumbers" @@ -95,6 +95,25 @@ def check_correlation(mbs): out, err = spearman_correlation.communicate() +def check_pearson_correlation(mbs): + '''Check Pearson pairwise correlation of samples based on read counts.''' + + pearson_filename = 'heatmap_PearsonCorr.pdf' + pearson_params = "--corMethod pearson --skipZero" + \ + " --plotTitle \"Pearson Correlation of Read Counts\"" + \ + " --whatToPlot heatmap --colorMap RdYlBu --plotNumbers" + + pearson_command = ( + "plotCorrelation -in %s %s -o %s" + % (mbs, pearson_params, pearson_filename) + ) + + logger.info("Running deeptools with %s", pearson_command) + + pearson_correlation = subprocess.Popen(pearson_command, shell=True) + out, err = pearson_correlation.communicate() + + def check_coverage(design, extension): '''Asses the sequencing depth of samples.''' @@ -166,7 +185,9 @@ def main(): # Run correlation mbs_filename = generate_read_summary(design_df, extension) - check_correlation(mbs_filename) + check_spearman_correlation(mbs_filename) + check_pearson_correlation(mbs_filename) + # Run coverage check_coverage(design_df, extension) diff --git a/workflow/tests/test_experiment_qc.py b/workflow/tests/test_experiment_qc.py index 5256da5..6950950 100644 --- a/workflow/tests/test_experiment_qc.py +++ b/workflow/tests/test_experiment_qc.py @@ -33,7 +33,8 @@ def test_check_update_controls(design_bam): @pytest.mark.singleend def test_experiment_qc_singleend(): assert os.path.exists(os.path.join(test_output_path, 'sample_mbs.npz')) - assert os.path.exists(os.path.join(test_output_path, 'heatmap_SpearmanCorr.png')) + assert os.path.exists(os.path.join(test_output_path, 'heatmap_SpearmanCorr.pdf')) + assert os.path.exists(os.path.join(test_output_path, 'heatmap_PearsonCorr.pdf')) assert os.path.exists(os.path.join(test_output_path, 'coverage.png')) assert os.path.exists(os.path.join(test_output_path, 'ENCLB144FDT_fingerprint.png')) assert os.path.exists(os.path.join(test_output_path, 'ENCLB831RUI_fingerprint.png')) @@ -41,7 +42,8 @@ def test_experiment_qc_singleend(): @pytest.mark.pairdend def test_experiment_qc_pairedend(): assert os.path.exists(os.path.join(test_output_path, 'sample_mbs.npz')) - assert os.path.exists(os.path.join(test_output_path, 'heatmap_SpearmanCorr.png')) + assert os.path.exists(os.path.join(test_output_path, 'heatmap_SpearmanCorr.pdf')) + assert os.path.exists(os.path.join(test_output_path, 'heatmap_PearsonCorr.pdf')) assert os.path.exists(os.path.join(test_output_path, 'coverage.png')) assert os.path.exists(os.path.join(test_output_path, 'ENCLB568IYX_fingerprint.png')) assert os.path.exists(os.path.join(test_output_path, 'ENCLB637LZP_fingerprint.png')) -- GitLab