forked from johandahlberg/piper
-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathglobalConfig.sh
138 lines (120 loc) · 5.9 KB
/
globalConfig.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
# Start by exporting the shared drmaa libaries to the LD_LIBRARY_PATH
export LD_LIBRARY_PATH=/sw/apps/build/slurm-drmaa/default/lib/:$LD_LIBRARY_PATH
#---------------------------------------------
# Check if we are running on uppmax or locally, and set the jobrunners and path accordingly
#---------------------------------------------
if [ -f "/sw/apps/build/slurm-drmaa/default/lib/libdrmaa.so" ];
then
JOB_RUNNER=" Drmaa"
JOB_NATIVE_ARGS="-A ${PROJECT_ID} -p node -N 1 ${QOS}"
PATH_TO_BWA="/sw/apps/bioinfo/bwa/0.7.5a/milou/bin/bwa"
PATH_TO_SAMTOOLS="/sw/apps/bioinfo/samtools/0.1.19/milou/bin/samtools"
PATH_TO_RNA_SEQ_QC="/proj/b2010028/piper_resources/programs/RNA-SeQC_v1.1.7.jar"
PATH_TO_TOPHAT="/sw/apps/bioinfo/tophat/2.0.10/kalkyl/bin/tophat2"
PATH_TO_CUTADAPT="/sw/apps/bioinfo/cutadapt/1.2.1/kalkyl/bin/cutadapt"
PATH_TO_CUFFLINKS="/sw/apps/bioinfo/cufflinks/2.1.1/kalkyl/cufflinks"
PATH_TO_CUFFDIFF="/sw/apps/bioinfo/cufflinks/2.1.1/kalkyl/cuffdiff"
PATH_TO_QUALIMAP="/proj/b2010028/piper_resources/programs/qualimap_v1.0/qualimap"
PATH_TO_SYNC_CUTADAPT="/proj/b2010028/piper_resources/programs/FixEmptyReads.pl"
GATK_BUNDLE_B37="/proj/b2010028/references/piper_references/gatk_bundle/2.8/b37"
GATK_BUNDLE_HG19="/proj/b2010028/references/piper_references/gatk_bundle/2.8/hg19"
elif [ -f "/usr/lib/slurm-drmaa/lib/libdrmaa.so" ];
then
JOB_RUNNER=" Drmaa"
JOB_NATIVE_ARGS=""
PATH_TO_BWA="/data/programs/bwa-0.7.5a/bwa"
PATH_TO_SAMTOOLS="/data/programs/samtools-0.1.19/samtools"
PATH_TO_RNA_SEQ_QC="/data/programs/RNA-SeQC_v1.1.7.jar"
PATH_TO_TOPHAT="/data/programs/tophat-2.0.10.Linux_x86_64/tophat2"
PATH_TO_CUTADAPT="/data/programs/cutadapt/cutadapt-1.4.1/bin/cutadapt"
PATH_TO_CUFFLINKS="/data/programs/cufflinks-2.1.1.Linux_x86_64/cufflinks"
PATH_TO_CUFFDIFF="/data/programs/cufflinks-2.1.1.Linux_x86_64/cuffdiff"
PATH_TO_QUALIMAP="/data/programs/qualimap_v1.0/qualimap"
PATH_TO_SYNC_CUTADAPT="/data/programs/FixEmptyReads.pl"
GATK_BUNDLE_B37="/data/test_data/piper_references/gatk_bundle/2.8/b37"
GATK_BUNDLE_HG19="/data/test_data/piper_references/gatk_bundle/2.8/b37/hg19"
else
JOB_RUNNER=" Shell"
JOB_NATIVE_ARGS=""
PATH_TO_BWA="/data/programs/bwa-0.7.5a/bwa"
PATH_TO_SAMTOOLS="/data/programs/samtools-0.1.19/samtools"
PATH_TO_RNA_SEQ_QC="/data/programs/RNA-SeQC_v1.1.7.jar"
PATH_TO_TOPHAT="/data/programs/tophat-2.0.10.Linux_x86_64/tophat2"
PATH_TO_CUTADAPT="/data/programs/cutadapt/cutadapt-1.4.1/bin/cutadapt"
PATH_TO_CUFFLINKS="/data/programs/cufflinks-2.1.1.Linux_x86_64/cufflinks"
PATH_TO_CUFFDIFF="/data/programs/cufflinks-2.1.1.Linux_x86_64/cuffdiff"
PATH_TO_SYNC_CUTADAPT="/data/programs/FixEmptyReads.pl"
PATH_TO_QUALIMAP="/data/programs/qualimap_v1.0/qualimap"
GATK_BUNDLE_B37="/local/test_data/piper_references/gatk_bundle/2.8/b37"
GATK_BUNDLE_HG19="/local/test_data/piper_references/gatk_bundle/2.8/b37"
fi
#---------------------------------------------
# Paths to general resources
#---------------------------------------------
DB_SNP_B37=${GATK_BUNDLE_B37}"/dbsnp_138.b37.vcf"
MILLS_B37=${GATK_BUNDLE_B37}"/Mills_and_1000G_gold_standard.indels.b37.vcf"
ONE_K_G_B37=${GATK_BUNDLE_B37}"/1000G_phase1.indels.b37.vcf"
HAPMAP_B37=${GATK_BUNDLE_B37}"/hapmap_3.3.b37.vcf"
OMNI_B37=${GATK_BUNDLE_B37}"/1000G_omni2.5.b37.vcf"
MILLS_B37=${GATK_BUNDLE_B37}"/Mills_and_1000G_gold_standard.indels.b37.vcf"
THOUSAND_GENOMES_B37=${GATK_BUNDLE_B37}"/1000G_phase1.snps.high_confidence.b37.vcf"
DB_SNP_HG19=${GATK_BUNDLE_H19}"/dbsnp_138.hg19.vcf"
MILLS_HG19=${GATK_BUNDLE_H19}"/Mills_and_1000G_gold_standard.indels.hg19.vcf"
ONE_K_G_HG19=${GATK_BUNDLE_H19}"/1000G_phase1.indels.hg19.vcf"
HAPMAP_H19=${GATK_BUNDLE_HG19}"/hapmap_3.3.hg19.vcf"
OMNI_HG19=${GATK_BUNDLE_HG19}"/1000G_omni2.5.hg19.vcf"
MILLS_HG19=${GATK_BUNDLE_HG19}"/Mills_and_1000G_gold_standard.indels.hg19.vcf"
THOUSAND_GENOMES_HG19=${GATK_BUNDLE_HG19}"/1000G_phase1.snps.high_confidence.hg19.vcf"
#---------------------------------------------
# Global variables
#---------------------------------------------
# Note that the tmp folder needs to be placed in a location that can be reached from all nodes.
# Note that $SNIC_TMP cannot be used since that will lose necessary data as the nodes/core switch.
TMP=tmp/${PROJECT_NAME}
# Comment and uncomment DEBUG to enable/disable the debugging mode of the pipeline.
DEBUG="-l DEBUG" # -startFromScratch"
if [ ! -d "${TMP}" ]; then
mkdir -p ${TMP}
fi
JAVA_TMP="-Djava.io.tmpdir="${TMP}
#This will execute the removal of the tmp directory
trap clean_up SIGHUP SIGINT SIGTERM
QUEUE="${PWD}/lib/Queue.jar"
## Get location of globConfig script
_GLOB_CONF_LOCATION="$(readlink -f ${BASH_SOURCE[0]})"
_THIS_SCRIPT_LOCATION="$(dirname $_GLOB_CONF_LOCATION)"
SCRIPTS_DIR="${_THIS_SCRIPT_LOCATION}/../qscripts"
NBR_OF_THREADS=8
# Setup directory structure
PIPELINE_OUTPUT="pipeline_output"
RAW_BAM_OUTPUT=$PIPELINE_OUTPUT"/bam_files_raw"
RAW_MERGED_BAM_OUTPUT=$PIPELINE_OUTPUT"/bam_files_raw_merged"
ALIGNMENT_QC_OUTPUT=$PIPELINE_OUTPUT"/alignment_qc"
PROCESSED_BAM_OUTPUT=$PIPELINE_OUTPUT"/bam_files_processed"
CUFFLINKS_OUTPUT=$PIPELINE_OUTPUT"/cufflinks"
CUFFDIFF_OUTPUT=$PIPELINE_OUTPUT"/cuffdiff"
VCF_OUTPUT=$PIPELINE_OUTPUT"/vcf_files"
LOGS=$PIPELINE_OUTPUT"/logs"
RNA_QC_OUTPUT=$PIPELINE_OUTPUT"/RNA_QC"
# -----------------
# Utility functions
# -----------------
# Setup temporary directory for the the Qscript tmp files.
# This will be removed as long as the script dies gracefully
# (if it is killed with a kill -9, manual clean up will have to be run...)
function clean_up {
# Perform program exit housekeeping
rm -r ${TMP}
exit
}
# Move reports etc.
function final_clean_up {
# Move all the report files generated by Queue into a separate directory
if [ ! -d "reports" ]; then
mkdir "reports"
fi
mv *.jobreport.* reports/
# Remove the file temporary directory - otherwise it will fill up glob. And all the files which are required for
# the pipeline to run are written to the pipeline directory.
clean_up
}