Skip to content
Snippets Groups Projects
Commit daaf631d authored by Venkat Malladi's avatar Venkat Malladi
Browse files

Cleanup code after flake8.

parent a33eb4d4
Branches
Tags
No related merge requests found
...@@ -11,7 +11,7 @@ For more details: ...@@ -11,7 +11,7 @@ For more details:
%(prog)s --help %(prog)s --help
''' '''
## SETTINGS # SETTINGS
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
logger.addHandler(logging.NullHandler()) logger.addHandler(logging.NullHandler())
...@@ -57,7 +57,7 @@ def check_design_headers(design, paired): ...@@ -57,7 +57,7 @@ def check_design_headers(design, paired):
design_headers = list(design.columns.values) design_headers = list(design.columns.values)
if paired: # paired-end data if paired: # paired-end data
design_template.extend(['fastq_read2']) design_template.extend(['fastq_read2'])
# Check if headers # Check if headers
...@@ -79,7 +79,8 @@ def check_controls(design): ...@@ -79,7 +79,8 @@ def check_controls(design):
if len(missing_controls) > 0: if len(missing_controls) > 0:
logger.error('Missing control experiments: %s', list(missing_controls)) logger.error('Missing control experiments: %s', list(missing_controls))
raise Exception("Missing control experiments: %s" % list(missing_controls)) raise Exception("Missing control experiments: %s" %
list(missing_controls))
def check_files(design, fastq, paired): def check_files(design, fastq, paired):
...@@ -87,9 +88,9 @@ def check_files(design, fastq, paired): ...@@ -87,9 +88,9 @@ def check_files(design, fastq, paired):
logger.info("Running file check.") logger.info("Running file check.")
if paired: # paired-end data if paired: # paired-end data
files = list(design['fastq_read1']) + list(design['fastq_read2']) files = list(design['fastq_read1']) + list(design['fastq_read2'])
else: # single-end data else: # single-end data
files = design['fastq_read1'] files = design['fastq_read1']
files_found = fastq['name'] files_found = fastq['name']
...@@ -98,13 +99,14 @@ def check_files(design, fastq, paired): ...@@ -98,13 +99,14 @@ def check_files(design, fastq, paired):
if len(missing_files) > 0: if len(missing_files) > 0:
logger.error('Missing files from design file: %s', list(missing_files)) logger.error('Missing files from design file: %s', list(missing_files))
raise Exception("Missing files from design file: %s" % list(missing_files)) raise Exception("Missing files from design file: %s" %
list(missing_files))
else: else:
file_dict = fastq.set_index('name').T.to_dict() file_dict = fastq.set_index('name').T.to_dict()
design['fastq_read1'] = design['fastq_read1'] \ design['fastq_read1'] = design['fastq_read1'] \
.apply(lambda x: file_dict[x]['path']) .apply(lambda x: file_dict[x]['path'])
if paired: # paired-end data if paired: # paired-end data
design['fastq_read2'] = design['fastq_read2'] \ design['fastq_read2'] = design['fastq_read2'] \
.apply(lambda x: file_dict[x]['path']) .apply(lambda x: file_dict[x]['path'])
return design return design
......
...@@ -8,7 +8,6 @@ import argparse ...@@ -8,7 +8,6 @@ import argparse
import shutil import shutil
import shlex import shlex
import logging import logging
import sys
from multiprocessing import cpu_count from multiprocessing import cpu_count
import json import json
import utils import utils
...@@ -18,7 +17,7 @@ For more details: ...@@ -18,7 +17,7 @@ For more details:
%(prog)s --help %(prog)s --help
''' '''
## SETTINGS # SETTINGS
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
logger.addHandler(logging.NullHandler()) logger.addHandler(logging.NullHandler())
...@@ -56,8 +55,7 @@ def get_args(): ...@@ -56,8 +55,7 @@ def get_args():
return args return args
# Functions
## Functions
def check_tools(): def check_tools():
...@@ -102,7 +100,6 @@ def generate_sa(fastq, reference): ...@@ -102,7 +100,6 @@ def generate_sa(fastq, reference):
def align_se(fastq, sai, reference, fastq_basename): def align_se(fastq, sai, reference, fastq_basename):
'''Use BWA to align SE data.''' '''Use BWA to align SE data.'''
sam_filename = "%s.sam" % (fastq_basename)
bam_filename = '%s.srt.bam' % (fastq_basename) bam_filename = '%s.srt.bam' % (fastq_basename)
steps = [ steps = [
...@@ -118,6 +115,7 @@ def align_se(fastq, sai, reference, fastq_basename): ...@@ -118,6 +115,7 @@ def align_se(fastq, sai, reference, fastq_basename):
return bam_filename return bam_filename
def align_pe(fastq, sai, reference, fastq_basename): def align_pe(fastq, sai, reference, fastq_basename):
'''Use BWA to align PE data.''' '''Use BWA to align PE data.'''
...@@ -173,7 +171,7 @@ def main(): ...@@ -173,7 +171,7 @@ def main():
sai.append(sai_filename) sai.append(sai_filename)
# Run alignment for either PE or SE # Run alignment for either PE or SE
if paired: # paired-end data if paired: # paired-end data
fastq_r1_basename = os.path.basename( fastq_r1_basename = os.path.basename(
utils.strip_extensions(fastq[0], STRIP_EXTENSIONS)) utils.strip_extensions(fastq[0], STRIP_EXTENSIONS))
fastq_r2_basename = os.path.basename( fastq_r2_basename = os.path.basename(
......
...@@ -2,19 +2,17 @@ ...@@ -2,19 +2,17 @@
'''Trim low quality reads and remove sequences less than 35 base pairs.''' '''Trim low quality reads and remove sequences less than 35 base pairs.'''
import os
import subprocess import subprocess
import argparse import argparse
import shutil import shutil
import logging import logging
import sys
EPILOG = ''' EPILOG = '''
For more details: For more details:
%(prog)s --help %(prog)s --help
''' '''
## SETTINGS # SETTINGS
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
logger.addHandler(logging.NullHandler()) logger.addHandler(logging.NullHandler())
...@@ -65,7 +63,7 @@ def check_tools(): ...@@ -65,7 +63,7 @@ def check_tools():
def trim_reads(fastq, paired): def trim_reads(fastq, paired):
'''Run trim_galore on 1 or 2 files.''' '''Run trim_galore on 1 or 2 files.'''
if paired: # paired-end data if paired: # paired-end data
trim_params = '--paired -q 25 --illumina --gzip --length 35' trim_params = '--paired -q 25 --illumina --gzip --length 35'
trim_command = "trim_galore %s %s %s " \ trim_command = "trim_galore %s %s %s " \
% (trim_params, fastq[0], fastq[1]) % (trim_params, fastq[0], fastq[1])
......
...@@ -3,9 +3,6 @@ ...@@ -3,9 +3,6 @@
'''General utilities.''' '''General utilities.'''
import sys
import os
import subprocess
import shlex import shlex
import logging import logging
......
#!/usr/bin/env python3 #!/usr/bin/env python3
import os
import pytest import pytest
import pandas as pd import pandas as pd
from io import StringIO from io import StringIO
import check_design import check_design
import sys
DESIGN_STRING = """sample_id\tbiosample\tfactor\ttreatment\treplicate\tcontrol_id\tfastq_read1 DESIGN_STRING = """sample_id\tbiosample\tfactor\ttreatment\treplicate\tcontrol_id\tfastq_read1
...@@ -49,11 +47,12 @@ def design_2(design): ...@@ -49,11 +47,12 @@ def design_2(design):
design_df = design.drop(design.index[2]) design_df = design.drop(design.index[2])
return design_df return design_df
@pytest.fixture @pytest.fixture
def design_3(design): def design_3(design):
# Drop A_2 and B_2 and append as fastq_read2 # Drop A_2 and B_2 and append as fastq_read2
design_df = design.drop(design.index[[1,3]]) design_df = design.drop(design.index[[1, 3]])
design_df['fastq_read2'] = design.loc[[1,3],'fastq_read1'].values design_df['fastq_read2'] = design.loc[[1, 3], 'fastq_read1'].values
return design_df return design_df
...@@ -94,10 +93,10 @@ def test_check_files_missing_files(design, fastq_files_1): ...@@ -94,10 +93,10 @@ def test_check_files_missing_files(design, fastq_files_1):
def test_check_files_output_singleend(design, fastq_files): def test_check_files_output_singleend(design, fastq_files):
paired = False paired = False
new_design = check_design.check_files(design, fastq_files, paired) new_design = check_design.check_files(design, fastq_files, paired)
assert new_design.loc[0,'fastq_read1'] == "/path/to/file/A_1.fastq.gz" assert new_design.loc[0, 'fastq_read1'] == "/path/to/file/A_1.fastq.gz"
def test_check_files_output_pairedend(design_3, fastq_files): def test_check_files_output_pairedend(design_3, fastq_files):
paired = True paired = True
new_design = check_design.check_files(design_3, fastq_files, paired) new_design = check_design.check_files(design_3, fastq_files, paired)
assert new_design.loc[0,'fastq_read2'] == "/path/to/file/A_2.fastq.gz" assert new_design.loc[0, 'fastq_read2'] == "/path/to/file/A_2.fastq.gz"
#!/usr/bin/env python3 #!/usr/bin/env python3
import pytest import pytest
import shutil
import shlex
import utils import utils
STRIP_EXTENSIONS = ['.gz', '.fq', '.fastq', '.fa', '.fasta'] STRIP_EXTENSIONS = ['.gz', '.fq', '.fastq', '.fa', '.fasta']
@pytest.fixture @pytest.fixture
def steps(): def steps():
steps = [] steps = []
...@@ -56,15 +55,15 @@ def test_run_last_step_file(steps_2, capsys, tmpdir): ...@@ -56,15 +55,15 @@ def test_run_last_step_file(steps_2, capsys, tmpdir):
def test_strip_extensions(): def test_strip_extensions():
filename = utils.strip_extensions('ENCFF833BLU.fastq.gz',STRIP_EXTENSIONS) filename = utils.strip_extensions('ENCFF833BLU.fastq.gz', STRIP_EXTENSIONS)
assert filename == 'ENCFF833BLU' assert filename == 'ENCFF833BLU'
def test_strip_extensions_not_valid(): def test_strip_extensions_not_valid():
filename = utils.strip_extensions('ENCFF833BLU.not.valid',STRIP_EXTENSIONS) filename = utils.strip_extensions('ENCFF833BLU.not.valid', STRIP_EXTENSIONS)
assert filename == 'ENCFF833BLU.not.valid' assert filename == 'ENCFF833BLU.not.valid'
def test_strip_extensions_missing_basename(): def test_strip_extensions_missing_basename():
filename = utils.strip_extensions('.fastq.gz',STRIP_EXTENSIONS) filename = utils.strip_extensions('.fastq.gz', STRIP_EXTENSIONS)
assert filename == '.fastq' assert filename == '.fastq'
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment