From 1487eaa6439dfd9d1403d004ce3e532b7690b123 Mon Sep 17 00:00:00 2001 From: Venkat Malladi <venkat.malladi@utsouthwestern.edu> Date: Thu, 14 Jun 2018 14:26:50 -0500 Subject: [PATCH] Make pipeline to astrocyte standards. --- astrocyte_pkg.yml | 114 ++++++++++++++++++++++++++++++++++++ docs/index.md | 3 + workflow/conf/biohpc.config | 20 ------- workflow/main.nf | 6 +- 4 files changed, 120 insertions(+), 23 deletions(-) create mode 100644 astrocyte_pkg.yml create mode 100644 docs/index.md diff --git a/astrocyte_pkg.yml b/astrocyte_pkg.yml new file mode 100644 index 0000000..c6c16bf --- /dev/null +++ b/astrocyte_pkg.yml @@ -0,0 +1,114 @@ +# +# metadata for the Astrocyte CellRanger mkfastq workflow package +# + +# ----------------------------------------------------------------------------- +# BASIC INFORMATION +# ----------------------------------------------------------------------------- + +# A unique identifier for the workflow package, text/underscores only +name: 'cellranger_mkfastq' +# Who wrote this? +author: 'Gervaise Henry and Venkat Malladi' +# A contact email address for questions +email: 'bicf@utsouthwestern.edu' +# A more informative title for the workflow package +title: 'BICF CellRanger mkfastq Workflow' +# A summary of the workflow package in plain text +description: | + This is a workflow package for the BICF/Strand Lab CellRanger mkfastq workflow system. + It implements 10x CellRanger mkfastq analysis workflow application. + +# ----------------------------------------------------------------------------- +# DOCUMENTATION +# ----------------------------------------------------------------------------- + +# A list of documentation file in .md format that should be viewable from the +# web interface. These files are in the 'docs' subdirectory. The first file +# listed will be used as a documentation index and is index.md by convention +documentation_files: + - ['index.md'] + +# ----------------------------------------------------------------------------- +# NEXTFLOW WORKFLOW CONFIGURATION +# ----------------------------------------------------------------------------- + +# Remember - The workflow file is always named 'workflow/main.nf' +# The workflow must publish all final output into $baseDir + +# A list of cluster environment modules that this workflow requires to run. +# Specify versioned module names to ensure reproducability. +workflow_modules: + - 'python/3.6.1-2-anaconda' + - 'cellranger/2.1.1' + - 'bcl2fastq/2.17.1.14' + +# A list of parameters used by the workflow, defining how to present them, +# options etc in the web interface. For each parameter: +# +# REQUIRED INFORMATION +# id: The name of the parameter in the NEXTFLOW workflow +# type: The type of the parameter, one of: +# string - A free-format string +# integer - An integer +# real - A real number +# file - A single file from user data +# files - One or more files from user data +# select - A selection from a list of values +# required: true/false, must the parameter be entered/chosen? +# description: A user friendly description of the meaning of the parameter +# +# OPTIONAL INFORMATION +# default: A default value for the parameter (optional) +# min: Minium value/characters/files for number/string/files types +# max: Maxumum value/characters/files for number/string/files types +# regex: A regular expression that describes valid entries / filenames +# +# SELECT TYPE +# choices: A set of choices presented to the user for the parameter. +# Each choice is a pair of value and description, e.g. +# +# choices: +# - [ 'myval', 'The first option'] +# - [ 'myval', 'The second option'] +# +# NOTE - All parameters are passed to NEXTFLOW as strings... but they +# are validated by astrocyte using the information provided above + +workflow_parameters: + + - id: bcl + type: files + required: true + description: | + One or more input Tarball BCL files from a sequencing of 10x single-cell expereiment . + regex: ".*(tar)*" + + - id: design + type: file + required: true + description: | + A design file listing lane, sample, corresponding index. + + +# ----------------------------------------------------------------------------- +# SHINY APP CONFIGURATION +# ----------------------------------------------------------------------------- + +# Remember - The vizapp is always 'vizapp/server.R' 'vizapp/ui.R' +# The workflow must publish all final output into $baseDir + +# Name of the R module that the vizapp will run against +vizapp_r_module: 'R/3.2.1-intel' + +# List of any CRAN packages, not provided by the modules, that must be made +# available to the vizapp +vizapp_cran_packages: + - shiny + - shinyFiles + +# List of any Bioconductor packages, not provided by the modules, +# that must be made available to the vizapp +vizapp_bioc_packages: + +vizapp_github_packages: diff --git a/docs/index.md b/docs/index.md new file mode 100644 index 0000000..654bef8 --- /dev/null +++ b/docs/index.md @@ -0,0 +1,3 @@ +# Astrocyte CellRanger 10x Workflow Package + +## Workflow SOP diff --git a/workflow/conf/biohpc.config b/workflow/conf/biohpc.config index 360f31a..bb45b43 100644 --- a/workflow/conf/biohpc.config +++ b/workflow/conf/biohpc.config @@ -16,26 +16,6 @@ process { } } -params { - // Reference file paths on BioHPC - genomes { - 'ercc92' { - ref = '/project/apps_database/cellranger/refdata-cellranger-ercc92-1.2.0' - } - 'GRCh38' { - ref = '/project/apps_database/cellranger/refdata-cellranger-GRCh38-1.2.0' - } - 'hg19' { - ref = '/project/apps_database/cellranger/refdata-cellranger-hg19-1.2.0' - } - 'mm10' { - ref = '/project/apps_database/cellranger/refdata-cellranger-mm10-1.2.0' - } - 'hg19.mm10' { - ref = '/project/apps_database/cellranger/refdata-cellranger-hg19_and_mm10-1.2.0' - } - } -} trace { enabled = true diff --git a/workflow/main.nf b/workflow/main.nf index 9663e00..18e01b0 100644 --- a/workflow/main.nf +++ b/workflow/main.nf @@ -6,7 +6,7 @@ // Define Input variables params.bcl = "$baseDir/../test_data/*.tar" params.designFile = "$baseDir/../test_data/design.csv" -params.genome = 'GRCm38' + // Define List of Files tarList = Channel.fromPath( params.bcl ) @@ -51,7 +51,7 @@ process untarBCL { script: """ - + tar -xvf $tar """ } @@ -60,7 +60,7 @@ process untarBCL { process mkfastq { tag "${bcl.baseName}" - publishDir "$baseDir/output/fastq/${bcl.baseName}", mode: 'copy' + publishDir "$baseDir/output/fastq/${bcl.baseName}", mode: 'copy' input: -- GitLab