From 2d455586062742ee790332b32b27aab8892c1d45 Mon Sep 17 00:00:00 2001
From: Brandi Cantarel <brandi.cantarel@utsouthwestern.edu>
Date: Wed, 27 Feb 2019 20:52:41 -0600
Subject: [PATCH] update GRCh38-> human/GRCh38

---
 alignment/bamqc.sh                    | 2 +-
 alignment/dnaseqalign.sh              | 2 +-
 alignment/filter_genefusions.pl       | 4 ++--
 alignment/markdups.sh                 | 2 +-
 alignment/rnaseqalign.sh              | 2 +-
 alignment/starfusion.sh               | 4 ++--
 genect_rnaseq/cBioPortal_documents.pl | 2 +-
 variants/cnvkit.sh                    | 6 +++---
 variants/filter_cnvkit.pl             | 2 +-
 variants/somatic_callers.sh           | 4 ++--
 10 files changed, 15 insertions(+), 15 deletions(-)

diff --git a/alignment/bamqc.sh b/alignment/bamqc.sh
index eefb332..029a921 100644
--- a/alignment/bamqc.sh
+++ b/alignment/bamqc.sh
@@ -8,7 +8,7 @@ usage() {
   echo "-n  --NucType"
   echo "-p  --Prefix for output file name"
   echo "-c  --Capture Bedfile"
-  echo "Example: bash bamqc.sh -p prefix -r /project/shared/bicf_workflow_ref/GRCh38 -b SRR1551047.bam  -n dna -c target.bed"
+  echo "Example: bash bamqc.sh -p prefix -r /project/shared/bicf_workflow_ref/human/GRCh38 -b SRR1551047.bam  -n dna -c target.bed"
   exit 1
 }
 OPTIND=1 # Reset OPTIND
diff --git a/alignment/dnaseqalign.sh b/alignment/dnaseqalign.sh
index 36a1364..9ae193d 100644
--- a/alignment/dnaseqalign.sh
+++ b/alignment/dnaseqalign.sh
@@ -8,7 +8,7 @@ usage() {
   echo "-y  --FastQ R2"
   echo "-p  --Prefix for output file name"
   echo "-u  --UMI"
-  echo "Example: bash dnaseqalign.sh -p prefix -u 1 -r /project/shared/bicf_workflow_ref/GRCh38 -x SRR1551047_1.fastq.gz  -y SRR1551047_2.fastq.gz"
+  echo "Example: bash dnaseqalign.sh -p prefix -u 1 -r /project/shared/bicf_workflow_ref/human/GRCh38 -x SRR1551047_1.fastq.gz  -y SRR1551047_2.fastq.gz"
   exit 1
 }
 OPTIND=1 # Reset OPTIND
diff --git a/alignment/filter_genefusions.pl b/alignment/filter_genefusions.pl
index f44cf58..1c43cd3 100755
--- a/alignment/filter_genefusions.pl
+++ b/alignment/filter_genefusions.pl
@@ -14,13 +14,13 @@ while (my $line = <ENT>) {
       $entrez{$row[2]} = $row[1];
   }
 }
-open OM, "</project/shared/bicf_workflow_ref/GRCh38/clinseq_prj/utswv2_known_genefusions.txt" or die $!;
+open OM, "</project/shared/bicf_workflow_ref/human/GRCh38/clinseq_prj/utswv2_known_genefusions.txt" or die $!;
 while (my $line = <OM>) {
     chomp($line);
     $known{$line} = 1;
 }
 close OM;
-open OM, "</project/shared/bicf_workflow_ref/GRCh38/clinseq_prj/panel1410.genelist.txt" or die $!;
+open OM, "</project/shared/bicf_workflow_ref/human/GRCh38/clinseq_prj/panel1410.genelist.txt" or die $!;
 while (my $line = <OM>) {
     chomp($line);
     $keep{$line} = 1;
diff --git a/alignment/markdups.sh b/alignment/markdups.sh
index 6338711..b794b25 100644
--- a/alignment/markdups.sh
+++ b/alignment/markdups.sh
@@ -63,7 +63,7 @@ then
     samtools fastq -1 ${pair_id}.consensus.R1.fastq -2 ${pair_id}.consensus.R2.fastq ${pair_id}.consensus.bam
     gzip ${pair_id}.consensus.R1.fastq
     gzip ${pair_id}.consensus.R2.fastq
-    bwa mem -M -C -t 2 -R "@RG\tID:${pair_id}\tLB:tx\tPL:illumina\tPU:barcode\tSM:${pair_id}" /project/shared/bicf_workflow_ref/GRCh38/genome.fa ${pair_id}.consensus.R1.fastq.gz ${pair_id}.consensus.R2.fastq.gz | samtools view -1 - > ${pair_id}.consensus.bam
+    bwa mem -M -C -t 2 -R "@RG\tID:${pair_id}\tLB:tx\tPL:illumina\tPU:barcode\tSM:${pair_id}" /project/shared/bicf_workflow_ref/human/GRCh38/genome.fa ${pair_id}.consensus.R1.fastq.gz ${pair_id}.consensus.R2.fastq.gz | samtools view -1 - > ${pair_id}.consensus.bam
     samtools sort --threads 10 -o ${pair_id}.dedup.bam ${pair_id}.consensus.bam
 else
     cp ${sbam} ${pair_id}.dedup.bam    
diff --git a/alignment/rnaseqalign.sh b/alignment/rnaseqalign.sh
index 182a738..606af0a 100644
--- a/alignment/rnaseqalign.sh
+++ b/alignment/rnaseqalign.sh
@@ -9,7 +9,7 @@ usage() {
   echo "-a  --Method: hisat or star"
   echo "-p  --Prefix for output file name"
   echo "-u  --UMI sequences are in FQ Read Name"
-  echo "Example: bash rnaseqalign.sh -a hisat -p prefix -u -r /project/shared/bicf_workflow_ref/GRCh38 -x SRR1551047_1.fastq.gz  -y SRR1551047_2.fastq.gz"
+  echo "Example: bash rnaseqalign.sh -a hisat -p prefix -u -r /project/shared/bicf_workflow_ref/human/GRCh38 -x SRR1551047_1.fastq.gz  -y SRR1551047_2.fastq.gz"
   exit 1
 }
 OPTIND=1 # Reset OPTIND
diff --git a/alignment/starfusion.sh b/alignment/starfusion.sh
index d462f5a..3e1ec53 100644
--- a/alignment/starfusion.sh
+++ b/alignment/starfusion.sh
@@ -7,7 +7,7 @@ usage() {
   echo "-a  --FastQ R1"
   echo "-b  --FastQ R2"
   echo "-p  --Prefix for output file name"
-  echo "Example: bash starfusion.sh -p prefix -r /project/shared/bicf_workflow_ref/GRCh38 -a SRR1551047_1.fastq.gz  -b SRR1551047_2.fastq.gz"
+  echo "Example: bash starfusion.sh -p prefix -r /project/shared/bicf_workflow_ref/human/GRCh38 -a SRR1551047_1.fastq.gz  -b SRR1551047_2.fastq.gz"
   exit 1
 }
 OPTIND=1 # Reset OPTIND
@@ -67,7 +67,7 @@ cut -f 5-8 ${pair_id}.starfusion.txt |perl -pe 's/\^|:/\t/g' | awk '{print "sing
 if [[ $filter == 1 ]]
 then
     cut -f 6,8 ${pair_id}.starfusion.txt |grep -v Breakpoint |perl -pe 's/\t/\n/g' |awk -F ':' '{print $1"\t"$2-1"\t"$2}' > temp.bed
-    bedtools intersect -wao -a temp.bed -b /project/shared/bicf_workflow_ref/GRCh38/cytoBand.txt |cut -f 1,2,7 > cytoband_pos.txt
+    bedtools intersect -wao -a temp.bed -b /project/shared/bicf_workflow_ref/human/GRCh38/cytoBand.txt |cut -f 1,2,7 > cytoband_pos.txt
     perl $baseDir/filter_genefusions.pl -p ${pair_id} -f ${pair_id}.starfusion.txt
 fi
 
diff --git a/genect_rnaseq/cBioPortal_documents.pl b/genect_rnaseq/cBioPortal_documents.pl
index 25a816e..5b672a3 100644
--- a/genect_rnaseq/cBioPortal_documents.pl
+++ b/genect_rnaseq/cBioPortal_documents.pl
@@ -15,7 +15,7 @@ while (my $line = <ENT_ENS>){
   $entrez{$row[2]}=$row[1];
 }
 close ENT_ENS;
-open ENT_ENS, "</project/shared/bicf_workflow_ref/GRCh38/genenames.txt" or die $!;
+open ENT_ENS, "</project/shared/bicf_workflow_ref/human/GRCh38/genenames.txt" or die $!;
 my $gn_header = <ENT_ENS>;
 my %ensym;
 while (my $line = <ENT_ENS>){
diff --git a/variants/cnvkit.sh b/variants/cnvkit.sh
index ea813fb..743167f 100755
--- a/variants/cnvkit.sh
+++ b/variants/cnvkit.sh
@@ -26,7 +26,7 @@ done
 
 shift $(($OPTIND -1))
 
-index_path='/project/shared/bicf_workflow_ref/GRCh38/clinseq_prj/'
+index_path='/project/shared/bicf_workflow_ref/human/GRCh38/clinseq_prj/'
 
 # Check for mandatory options
 if [[ -z $pair_id ]] || [[ -z $sbam ]]; then
@@ -38,7 +38,7 @@ then
 fi
 baseDir="`dirname \"$0\"`"
 
-if [[ $capture == '/project/shared/bicf_workflow_ref/GRCh38/clinseq_prj/UTSWV2.bed' ]]
+if [[ $capture == '/project/shared/bicf_workflow_ref/human/GRCh38/clinseq_prj/UTSWV2.bed' ]]
 then 
     normals="${index_path}/UTSWV2.normals.cnn"
     targets="${index_path}/UTSWV2.cnvkit_"
@@ -64,5 +64,5 @@ cnvkit.py fix ${pair_id}.targetcoverage.cnn ${pair_id}.antitargetcoverage.cnn ${
 cnvkit.py segment ${pair_id}.cnr -o ${pair_id}.cns
 cnvkit.py call ${pair_id}.cns -o ${pair_id}.call.cns
 cnvkit.py scatter ${pair_id}.cnr -s ${pair_id}.call.cns -t --segment-color "blue" -o ${pair_id}.cnv.scatter.pdf
-cut -f 1,2,3 ${pair_id}.call.cns | grep -v chrom | bedtools intersect -wao -b /project/shared/bicf_workflow_ref/GRCh38/cytoBand.txt -a stdin |cut -f 1,2,3,7 >  ${pair_id}.cytoband.bed
+cut -f 1,2,3 ${pair_id}.call.cns | grep -v chrom | bedtools intersect -wao -b /project/shared/bicf_workflow_ref/human/GRCh38/cytoBand.txt -a stdin |cut -f 1,2,3,7 >  ${pair_id}.cytoband.bed
 perl $baseDir/filter_cnvkit.pl *.call.cns
diff --git a/variants/filter_cnvkit.pl b/variants/filter_cnvkit.pl
index b7504ad..b4ddacc 100755
--- a/variants/filter_cnvkit.pl
+++ b/variants/filter_cnvkit.pl
@@ -1,7 +1,7 @@
 #!/usr/bin/perl -w
 #parse_cnvkit_table.pl
 
-my $refdir = '/project/shared/bicf_workflow_ref/GRCh38/';
+my $refdir = '/project/shared/bicf_workflow_ref/human/GRCh38/';
 open OM, "<$refdir\/clinseq_prj/panel1410.genelist.txt" or die $!;
 while (my $line = <OM>) {
   chomp($line);
diff --git a/variants/somatic_callers.sh b/variants/somatic_callers.sh
index 4517c52..1adde7b 100755
--- a/variants/somatic_callers.sh
+++ b/variants/somatic_callers.sh
@@ -36,7 +36,7 @@ if [[ -z $SLURM_CPUS_ON_NODE ]]
     SLURM_CPUS_ON_NODE=1
 fi
 
-index_path=/project/shared/bicf_workflow_ref/GRCh38
+index_path=/project/shared/bicf_workflow_ref/human/GRCh38
 
 genome_reference=${index_path}/genome.fa
 cosmic_reference=${index_path}/cosmic.vcf.gz
@@ -76,7 +76,7 @@ fi
 if [ $algo == 'mutect' ]
   then
     module load parallel python/2.7.x-anaconda gatk/3.8  bcftools/intel/1.3 bedtools/2.25.0 snpeff/4.2 vcftools/0.1.14
-    cut -f 1 /project/shared/bicf_workflow_ref/GRCh38/genomefile.5M.txt | parallel --delay 2 -j 10 "java -Xmx20g -jar $GATK_JAR -R ${genome_reference} -D ${dbSnp_reference} -T MuTect2 -stand_call_conf 30 -stand_emit_conf 10.0 -A FisherStrand -A QualByDepth -A VariantType -A DepthPerAlleleBySample -A HaplotypeScore -A AlleleBalance -I:tumor ${tumor}.final.bam -I:normal ${normal}.final.bam --cosmic ${cosmic} -o ${tumor}.{}.mutect.vcf -L {}"
+    cut -f 1 /project/shared/bicf_workflow_ref/human/GRCh38/genomefile.5M.txt | parallel --delay 2 -j 10 "java -Xmx20g -jar $GATK_JAR -R ${genome_reference} -D ${dbSnp_reference} -T MuTect2 -stand_call_conf 30 -stand_emit_conf 10.0 -A FisherStrand -A QualByDepth -A VariantType -A DepthPerAlleleBySample -A HaplotypeScore -A AlleleBalance -I:tumor ${tumor}.final.bam -I:normal ${normal}.final.bam --cosmic ${cosmic} -o ${tumor}.{}.mutect.vcf -L {}"
     vcf-concat ${tumor}*.vcf | vcf-sort | vcf-annotate -n --fill-type | java -jar $SNPEFF_HOME/SnpSift.jar filter -p '((FS <= 60) & GEN[*].DP >= 10)' | perl -pe 's/TUMOR/'${tumor}'/' | perl -pe 's/NORMAL/'${normal}'/g' |bgzip > ${tumor}_${normal}.mutect.vcf.gz
 fi
 
-- 
GitLab