Skip to content

Commit

Permalink
Nf core vc (#7)
Browse files Browse the repository at this point in the history
* Add Annotation
* Annotation containers are tagged version.genomeversion
* Better indentation
* Replace `--sampleDir` by `--sample`
* add MultiQC
* update Tests
* Add parallelized testing on Travis
* Add parallelized building of Docker Images for annotation on CircleCI
* Update docs
  • Loading branch information
maxulysse authored May 8, 2019
1 parent 8c5a875 commit 3c5f236
Show file tree
Hide file tree
Showing 14 changed files with 2,363 additions and 1,153 deletions.
111 changes: 111 additions & 0 deletions .circleci/config.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,111 @@
version: 2.0
jobs:
snpeffgrch37:
docker:
- image: circleci/buildpack-deps:stretch
environment:
GENOME: GRCh37
SNPEFF_CACHE_VERSION: 75
steps:
- checkout
- setup_remote_docker
- run:
command: docker build -t nfcore/sareksnpeff:dev.${GENOME} containers/snpeff/. --build-arg GENOME=${GENOME} --build-arg SNPEFF_CACHE_VERSION=${SNPEFF_CACHE_VERSION}
- run:
command: |
echo "$DOCKERHUB_PASS" | docker login -u "$DOCKERHUB_USERNAME" --password-stdin
docker push nfcore/sareksnpeff:dev.${GENOME}
snpeffgrch38:
docker:
- image: circleci/buildpack-deps:stretch
environment:
GENOME: GRCh38
SNPEFF_CACHE_VERSION: 86
steps:
- checkout
- setup_remote_docker
- run:
command: docker build -t nfcore/sareksnpeff:dev.${GENOME} containers/snpeff/. --build-arg GENOME=${GENOME} --build-arg SNPEFF_CACHE_VERSION=${SNPEFF_CACHE_VERSION}
- run:
command: |
echo "$DOCKERHUB_PASS" | docker login -u "$DOCKERHUB_USERNAME" --password-stdin
docker push nfcore/sareksnpeff:dev.${GENOME}
snpeffgrcm38:
docker:
- image: circleci/buildpack-deps:stretch
environment:
GENOME: GRCm38
SNPEFF_CACHE_VERSION: 86
steps:
- checkout
- setup_remote_docker
- run:
command: docker build -t nfcore/sareksnpeff:dev.${GENOME} containers/snpeff/. --build-arg GENOME=${GENOME} --build-arg SNPEFF_CACHE_VERSION=${SNPEFF_CACHE_VERSION}
- run:
command: |
echo "$DOCKERHUB_PASS" | docker login -u "$DOCKERHUB_USERNAME" --password-stdin
docker push nfcore/sareksnpeff:dev.${GENOME}
vepgrch37:
docker:
- image: circleci/buildpack-deps:stretch
environment:
GENOME: GRCh37
SPECIES: homo_sapiens
VEP_VERSION: 95
steps:
- checkout
- setup_remote_docker
- run:
command: docker build -t nfcore/sarekvep:dev.${GENOME} containers/vep/. --build-arg GENOME=${GENOME} --build-arg SPECIES=${SPECIES} --build-arg VEP_VERSION=${VEP_VERSION}
no_output_timeout: 45m
- run:
command: echo "$DOCKERHUB_PASS" | docker login -u "$DOCKERHUB_USERNAME" --password-stdin ; docker push nfcore/sarekvep:dev.${GENOME}
no_output_timeout: 45m

vepgrch38:
docker:
- image: circleci/buildpack-deps:stretch
environment:
GENOME: GRCh38
SPECIES: homo_sapiens
VEP_VERSION: 95
steps:
- checkout
- setup_remote_docker
- run:
command: docker build -t nfcore/sarekvep:dev.${GENOME} containers/vep/. --build-arg GENOME=${GENOME} --build-arg SPECIES=${SPECIES} --build-arg VEP_VERSION=${VEP_VERSION}
no_output_timeout: 45m
- run:
command: echo "$DOCKERHUB_PASS" | docker login -u "$DOCKERHUB_USERNAME" --password-stdin ; docker push nfcore/sarekvep:dev.${GENOME}
no_output_timeout: 45m

vepgrcm38:
docker:
- image: circleci/buildpack-deps:stretch
environment:
GENOME: GRCm38
SPECIES: mus_musculus
VEP_VERSION: 95
steps:
- checkout
- setup_remote_docker
- run:
command: docker build -t nfcore/sarekvep:dev.${GENOME} containers/vep/. --build-arg GENOME=${GENOME} --build-arg SPECIES=${SPECIES} --build-arg VEP_VERSION=${VEP_VERSION}
no_output_timeout: 45m
- run:
command: echo "$DOCKERHUB_PASS" | docker login -u "$DOCKERHUB_USERNAME" --password-stdin ; docker push nfcore/sarekvep:dev.${GENOME}
no_output_timeout: 45m

workflows:
version: 2
build:
jobs:
- snpeffgrch37
- snpeffgrch38
- snpeffgrcm38
- vepgrch37
- vepgrch38
- vepgrcm38
22 changes: 15 additions & 7 deletions .travis.yml
Original file line number Diff line number Diff line change
Expand Up @@ -14,15 +14,20 @@ matrix:
fast_finish: true

env:
- NXF_VER=19.04.0
global:
- NXF_VER=19.04.0
matrix:
- TEST=SOMATIC
- TEST=GERMLINE
- TEST=TARGETED
- TEST=ANNOTATEVEP
- TEST=ANNOTATESNPEFF

before_install:
# PRs to master are only ok if coming from dev branch
- '[ $TRAVIS_PULL_REQUEST = "false" ] || [ $TRAVIS_BRANCH != "master" ] || ([ $TRAVIS_PULL_REQUEST_SLUG = $TRAVIS_REPO_SLUG ] && [ $TRAVIS_PULL_REQUEST_BRANCH = "dev" ])'
# Pull the docker image first so the test doesn't wait for this
- docker pull nfcore/sarek:dev
# Fake the tag locally so that the pipeline runs properly
- docker tag nfcore/sarek:dev nfcore/sarek:dev
- "travis_retry ./bin/download_docker.sh --test $TEST"

install:
# Install Nextflow
Expand All @@ -32,7 +37,10 @@ install:
# Reset
- mkdir ${TRAVIS_BUILD_DIR}/tests && cd ${TRAVIS_BUILD_DIR}/tests

# Build references if needed
before_script:
- "${TRAVIS_BUILD_DIR}/bin/build_reference.sh --test $TEST --build"

# Actual tests
script:
- git clone --single-branch --branch sarek https://github.com/nf-core/test-datasets.git data
- nextflow run ${TRAVIS_BUILD_DIR}/build.nf -profile docker --genome smallGRCh37 --refdir data/reference --outdir references --publishDirMode link --max_memory 7.GB --max_cpus 2 -ansi-log false
- nextflow run ${TRAVIS_BUILD_DIR}/main.nf -profile docker --genome smallGRCh37 --sample data/testdata/tsv/tiny-manta.tsv --tools HaploTypeCaller,Manta,Strelka,MuTecT2,FreeBayes --igenomes_base references --publishDirMode link --max_memory 7.GB --max_cpus 2 -ansi-log false
- "${TRAVIS_BUILD_DIR}/bin/run_tests.sh --test $TEST"
29 changes: 23 additions & 6 deletions Jenkinsfile
Original file line number Diff line number Diff line change
Expand Up @@ -8,26 +8,43 @@ pipeline {
stages {
stage('Setup environment') {
steps {
sh "docker pull nfcore/sarek:dev"
sh "./bin/download_docker.sh -t ALL"
}
}
stage('Build') {
steps {
sh "rm -rf data"
sh "git clone --single-branch --branch sarek https://github.com/nf-core/test-datasets.git data"
sh "nextflow run build.nf -profile docker --genome smallGRCh37 --refdir data/reference --outdir references --publishDirMode link -ansi-log false"
sh "./bin/build_reference.sh --test ALL --build"
sh "rm -rf work/ references/pipeline_info .nextflow*"
}
}
stage('SampleDir') {
stage('Somatic') {
steps {
sh "nextflow run main.nf -profile docker --sampleDir data/testdata/tiny/normal --tools HaplotypeCaller,Manta,Strelka --genome smallGRCh37 --igenomes_base references --publishDirMode link -ansi-log false"
sh "./bin/run_tests.sh --test SOMATIC"
sh "rm -rf work/ .nextflow* results/"
}
}
stage('Germline') {
steps {
sh "./bin/run_tests.sh --test GERMLINE"
sh "rm -rf work/ .nextflow* results/"
}
}
stage('targeted') {
steps {
sh "./bin/run_tests.sh --test TARGETED"
sh "rm -rf work/ .nextflow* results/"
}
}
stage('Annotation') {
steps {
sh "./bin/run_tests.sh --test ANNOTATEALL"
sh "rm -rf work/ .nextflow* results/"
}
}
stage('Multiple') {
steps {
sh "nextflow run main.nf -profile docker --sample data/testdata/tsv/tiny-multiple.tsv --tools HaploTypeCaller,Manta,Strelka,MuTecT2,FreeBayes --genome smallGRCh37 --igenomes_base references --publishDirMode link -ansi-log false"
sh "./bin/run_tests.sh --test MULTIPLE"
sh "rm -rf work/ .nextflow* results/"
}
}
Expand Down
12 changes: 9 additions & 3 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -7,9 +7,11 @@
[![Nextflow version][nextflow-badge]](https://www.nextflow.io)
[![Travis build status][travis-badge]](https://travis-ci.org/nf-core/sarek)
[![CircleCi build status][circleci-badge]](https://circleci.com/gh/nf-core/workflows/sarek)

[![Install with bioconda][bioconda-badge]](http://bioconda.github.io/)
[![Docker Container available][docker-badge]](https://hub.docker.com/r/nfcore/sarek)
[![Docker Container available][docker-sarek-badge]](https://hub.docker.com/r/nfcore/sarek)
[![Install with Singularity][singularity-badge]](https://www.sylabs.io/docs/)

[![Join us on Slack][slack-badge]](https://nfcore.slack.com/messages/CGFUX04HZ/)

Expand Down Expand Up @@ -77,7 +79,7 @@ The worflow steps and tools used are as follows:
* [GATK ApplyBQSR](https://github.com/broadinstitute/gatk)
2. **Germline variant calling** - `germlineVC.nf`
* SNVs and small indels
* [GATK HaplotyeCaller](https://github.com/broadinstitute/gatk)
* [GATK HaplotypeCaller](https://github.com/broadinstitute/gatk)
* [Strelka2](https://github.com/Illumina/strelka)
* Structural variants
* [Manta](https://github.com/Illumina/manta)
Expand Down Expand Up @@ -139,10 +141,14 @@ For further information or help, don't hesitate to get in touch on [Slack](https

[bioconda-badge]: https://img.shields.io/badge/install%20with-bioconda-brightgreen.svg?logo=
[btb-link]: https://ki.se/forskning/barntumorbanken-0
[docker-badge]: https://img.shields.io/docker/automated/nfcore/sarek.svg?logo=docker
[circleci-badge]: https://img.shields.io/circleci/project/github/nf-core/sarek.svg?logo=circleci
[docker-sarek-badge]: https://img.shields.io/docker/automated/nfcore/sarek.svg?logo=docker
[docker-snpeff-badge]: https://img.shields.io/docker/automated/nfcore/sareksnpeff.svg?logo=docker
[docker-vep-badge]: https://img.shields.io/docker/automated/nfcore/sarekvep.svg?logo=docker
[nbis-link]: https://nbis.se
[nextflow-badge]: https://img.shields.io/badge/nextflow-%E2%89%A519.04.0-brightgreen.svg?logo=
[ngi-link]: https://ngisweden.scilifelab.se/
[scilifelab-link]: https://scilifelab.se
[singularity-badge]: https://img.shields.io/badge/use%20with-singularity-purple.svg
[slack-badge]: https://img.shields.io/badge/slack-nfcore/sarek-blue.svg?logo=slack
[travis-badge]: https://img.shields.io/travis/nf-core/sarek.svg?logo=travis
38 changes: 38 additions & 0 deletions bin/build_reference.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@
#!/bin/bash
set -xeuo pipefail

BUILD=false
TEST=ALL
TRAVIS_BUILD_DIR=${TRAVIS_BUILD_DIR:-.}
TRAVIS=${TRAVIS:-false}

while [[ $# -gt 0 ]]
do
key=$1
case $key in
-t|--test)
TEST=$2
shift # past argument
shift # past value
;;
-b|--build)
BUILD=true
shift # past value
;;
*) # unknown option
shift # past argument
;;
esac
done

# Always download test data
rm -rf data
git clone --single-branch --branch sarek https://github.com/nf-core/test-datasets.git data

# Build references for smallGRCh37
if [[ BUILD ]] && [[ $TEST != ANNOTATESNPEFF ]] && [[ $TEST != ANNOTATEVEP ]]
then
rm -rf references
nextflow run ${TRAVIS_BUILD_DIR}/build.nf -profile docker -ansi-log false --publishDirMode link --max_memory 7.GB --max_cpus 2 -dump-channels --genome smallGRCh37 --refdir data/reference --outdir references
rm -rf .nextflow* references/pipeline_info work
fi
32 changes: 32 additions & 0 deletions bin/download_docker.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,32 @@
#!/bin/bash
set -xeuo pipefail

TEST=ALL

while [[ $# -gt 0 ]]
do
key=$1
case $key in
-t|--test)
TEST=$2
shift # past argument
shift # past value
;;
*) # unknown option
shift # past argument
;;
esac
done

if [[ ALL,ANNOTATEALL,ANNOTATEVEP =~ $TEST ]]
then
docker pull nfcore/sarekvep:dev.GRCh37
docker tag nfcore/sarekvep:dev.GRCh37 nfcore/sarekvep:dev.smallGRCh37
elif [[ ALL,ANNOTATEALL,ANNOTATESNPEFF =~ $TEST ]]
then
docker pull nfcore/sareksnpeff:dev.GRCh37
docker tag nfcore/sareksnpeff:dev.GRCh37 nfcore/sareksnpeff:dev.smallGRCh37
else
docker pull nfcore/sarek:dev
docker tag nfcore/sarek:dev nfcore/sarek:dev
fi
66 changes: 66 additions & 0 deletions bin/run_tests.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,66 @@
#!/bin/bash
set -xeuo pipefail

CPUS=2
TEST=ALL
TRAVIS_BUILD_DIR=${TRAVIS_BUILD_DIR:-.}
TRAVIS=${TRAVIS:-false}

while [[ $# -gt 0 ]]
do
key=$1
case $key in
-t|--test)
TEST=$2
shift # past argument
shift # past value
;;
-c|--cpus)
CPUS=$2
shift # past value
;;
*) # unknown option
shift # past argument
;;
esac
done

function run_sarek() {
nextflow run ${TRAVIS_BUILD_DIR}/main.nf -profile docker -ansi-log false --publishDirMode link --max_memory 7.GB --max_cpus 2 -dump-channels --genome smallGRCh37 --igenomes_base references $@
}

if [[ ALL,GERMLINE =~ $TEST ]]
then
run_sarek --sample data/testdata/tiny/normal --tools HaplotypeCaller,Strelka --noReports
run_sarek --step recalibrate --noReports
fi

if [[ ALL,SOMATIC =~ $TEST ]]
then
run_sarek --sample data/testdata/tsv/tiny-manta.tsv --tools FreeBayes,HaplotypeCaller,Manta,Strelka,Mutect2 --noReports
fi

if [[ ALL,TARGETED =~ $TEST ]]
then
run_sarek --sample data/testdata/tsv/tiny-manta.tsv --tools FreeBayes,HaplotypeCaller,Manta,Strelka,Mutect2 --noReports --targetBED data/testdata/target.bed
fi

if [[ ALL,ANNOTATEALL,ANNOTATESNPEFF,ANNOTATEVEP =~ $TEST ]]
then
if [[ $TEST = ANNOTATESNPEFF ]]
then
ANNOTATOR=snpEFF
elif [[ $TEST = ANNOTATEVEP ]]
then
ANNOTATOR=VEP
elif [[ ALL,ANNOTATEALL =~ $TEST ]]
then
ANNOTATOR=merge,snpEFF,VEP
fi
run_sarek --step annotate --tools ${ANNOTATOR} --annotateVCF data/testdata/vcf/Strelka_1234N_variants.vcf.gz --noReports
fi

if [[ MULTIPLE =~ $TEST ]]
then
run_sarek --sample data/testdata/tsv/tiny-multiple.tsv --tools FreeBayes,HaplotypeCaller,Manta,Strelka,Mutect2 --noReports
fi
Loading

0 comments on commit 3c5f236

Please sign in to comment.