-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge branch 'master' of github.com:klarman-cell-observatory/scrnaseq…
…_pipeline
- Loading branch information
Showing
9 changed files
with
2,283 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,52 @@ | ||
#!/bin/bash | ||
|
||
# | ||
# conda create -n dsub_env python=3 pip | ||
# conda activate dsub_env | ||
# pip install --upgrade dsub | ||
# conda install -c conda-forge google-cloud-sdk | ||
# gcloud auth configure-docker | ||
# | ||
|
||
# conda activate dsub_env | ||
|
||
dir_name="finngen_atac" | ||
gcp_bucket_basedir="gs://fc-secure-d4adbbf9-8265-4a5c-b14f-23a5f1b5c4f9/${dir_name}" | ||
sample_tracking_file="${gcp_bucket_basedir}/011124_pooled_atac_count_sampletracker.csv" | ||
project_name="finngen_atac" | ||
email="will@broadinstitute.org" | ||
workspace="'693-finland-v2f/Finngen'" | ||
count_matrix_name="raw_feature_bc_matrix.h5" | ||
steps="COUNT" | ||
mkfastq_memory="256G" | ||
mkfastq_diskspace="2500" | ||
cellranger_method="broadinstitute:cumulus:Cellranger:2.2.0" | ||
cumulus_method="broadinstitute:cumulus:cumulus:2.1.1" | ||
cellbender_method="cellbender/remove-background/11" | ||
cellranger_version="7.0.1" | ||
cellranger_atac_version="2.1.0" | ||
cellranger_arc_version="2.0.1" | ||
|
||
current_time=$(date "+%Y.%m.%d-%H.%M.%S") | ||
|
||
dsub --provider google-cls-v2 --project "microbiome-xavier" --regions us-east1 \ | ||
--service-account "scrnaseq-pipeline@microbiome-xavier.iam.gserviceaccount.com" \ | ||
--image "gcr.io/microbiome-xavier/conda-alto" --disk-size '10' --timeout '2d'\ | ||
--logging "$gcp_bucket_basedir/logs/" \ | ||
--command "wget https://github.com/will-broad/scrnaseq_pipeline/archive/atac.zip && unzip atac.zip && cd scrnaseq_pipeline-atac/src && python sc_pipeline.py" \ | ||
--output PIPELINE_LOGS="$gcp_bucket_basedir/logs/execution_$current_time.log" \ | ||
--input SAMPLE_TRACKING_FILE="$sample_tracking_file" \ | ||
--env PROJECT_NAME="$project_name" \ | ||
--env GCP_BUCKET_BASEDIR="$gcp_bucket_basedir" \ | ||
--env EMAIL="$email" \ | ||
--env TERRA_WORKSPACE="$workspace" \ | ||
--env COUNT_MATRIX_NAME="$count_matrix_name" \ | ||
--env STEPS="$steps" \ | ||
--env CELLRANGER_METHOD="$cellranger_method" \ | ||
--env CUMULUS_METHOD="$cumulus_method" \ | ||
--env CELLBENDER_METHOD="$cellbender_method" \ | ||
--env CELLRANGER_VERSION="$cellranger_version" \ | ||
--env CELLRANGER_ATAC_VERSION="$cellranger_atac_version" \ | ||
--env CELLRANGER_ARC_VERSION="$cellranger_arc_version" \ | ||
--env MKFASTQ_DISKSPACE="$mkfastq_diskspace" \ | ||
--env MKFASTQ_MEMORY="$mkfastq_memory" |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,53 @@ | ||
#!/bin/bash | ||
|
||
# | ||
# conda create -n dsub_env python=3 pip | ||
# conda activate dsub_env | ||
# pip install --upgrade dsub | ||
# conda install -c conda-forge google-cloud-sdk | ||
# gcloud auth configure-docker | ||
# | ||
|
||
# conda activate dsub_env | ||
|
||
dir_name="finngen_gex" | ||
gcp_bucket_basedir="gs://fc-secure-d4adbbf9-8265-4a5c-b14f-23a5f1b5c4f9/${dir_name}" | ||
sample_tracking_file="${gcp_bucket_basedir}/042424_batch4_gex_count_sampletracker.csv" | ||
project_name="finngen_gex" | ||
email="will@broadinstitute.org" | ||
workspace="'693-finland-v2f/Finngen'" | ||
count_matrix_name="raw_feature_bc_matrix.h5" | ||
steps="COUNT,CELLBENDER" | ||
mkfastq_memory="256G" | ||
mkfastq_diskspace="2500" | ||
cellranger_method="broadinstitute:cumulus:Cellranger:2.2.0" | ||
cumulus_method="broadinstitute:cumulus:cumulus:2.1.1" | ||
cellbender_method="cellbender/remove-background/13" | ||
cellranger_version="7.0.1" | ||
cellranger_atac_version="2.1.0" | ||
cellranger_arc_version="2.0.1" | ||
|
||
current_time=$(date "+%Y.%m.%d-%H.%M.%S") | ||
|
||
dsub --provider google-cls-v2 --project "microbiome-xavier" --regions us-east1 \ | ||
--service-account "scrnaseq-pipeline@microbiome-xavier.iam.gserviceaccount.com" \ | ||
--image "gcr.io/microbiome-xavier/conda-alto" --disk-size '10' --boot-disk-size '30' --timeout '2d'\ | ||
--logging "$gcp_bucket_basedir/logs/" \ | ||
--machine-type 'n1-standard-16' \ | ||
--command "wget https://github.com/will-broad/scrnaseq_pipeline/archive/gex.zip && unzip gex.zip && cd scrnaseq_pipeline-gex/src && python sc_pipeline.py" \ | ||
--output PIPELINE_LOGS="$gcp_bucket_basedir/logs/execution_$current_time.log" \ | ||
--input SAMPLE_TRACKING_FILE="$sample_tracking_file" \ | ||
--env PROJECT_NAME="$project_name" \ | ||
--env GCP_BUCKET_BASEDIR="$gcp_bucket_basedir" \ | ||
--env EMAIL="$email" \ | ||
--env TERRA_WORKSPACE="$workspace" \ | ||
--env COUNT_MATRIX_NAME="$count_matrix_name" \ | ||
--env STEPS="$steps" \ | ||
--env CELLRANGER_METHOD="$cellranger_method" \ | ||
--env CUMULUS_METHOD="$cumulus_method" \ | ||
--env CELLBENDER_METHOD="$cellbender_method" \ | ||
--env CELLRANGER_VERSION="$cellranger_version" \ | ||
--env CELLRANGER_ATAC_VERSION="$cellranger_atac_version" \ | ||
--env CELLRANGER_ARC_VERSION="$cellranger_arc_version" \ | ||
--env MKFASTQ_DISKSPACE="$mkfastq_diskspace" \ | ||
--env MKFASTQ_MEMORY="$mkfastq_memory" |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,53 @@ | ||
#!/bin/bash | ||
|
||
# | ||
# conda create -n dsub_env python=3 pip | ||
# conda activate dsub_env | ||
# pip install --upgrade dsub | ||
# conda install -c conda-forge google-cloud-sdk | ||
# gcloud auth configure-docker | ||
# | ||
|
||
# conda activate dsubenv | ||
|
||
dir_name="finngen_multiome" | ||
gcp_bucket_basedir="gs://fc-secure-d4adbbf9-8265-4a5c-b14f-23a5f1b5c4f9/${dir_name}" | ||
sample_tracking_file="${gcp_bucket_basedir}/042624_batch4_multiome_count_sampletracker.csv" | ||
project_name="finngen_multiome" | ||
email="will@broadinstitute.org" | ||
workspace="'693-finland-v2f/Finngen'" | ||
count_matrix_name="raw_feature_bc_matrix.h5" | ||
steps="COUNT" | ||
mkfastq_memory="256G" | ||
mkfastq_diskspace="3000" | ||
cellranger_method="broadinstitute:cumulus:Cellranger:2.2.0" | ||
cumulus_method="broadinstitute:cumulus:cumulus:2.1.1" | ||
cellbender_method="cellbender/remove-background/11" | ||
cellranger_version="7.0.1" | ||
cellranger_atac_version="2.1.0" | ||
cellranger_arc_version="2.0.2.custom-max-cell" | ||
|
||
current_time=$(date "+%Y.%m.%d-%H.%M.%S") | ||
|
||
dsub --provider google-cls-v2 --project "microbiome-xavier" --regions us-east1 \ | ||
--service-account "scrnaseq-pipeline@microbiome-xavier.iam.gserviceaccount.com" \ | ||
--image "gcr.io/microbiome-xavier/conda-alto" --disk-size '10' --boot-disk-size '30' --timeout '2d'\ | ||
--machine-type 'n1-standard-4' \ | ||
--logging "$gcp_bucket_basedir/logs/" \ | ||
--command "wget https://github.com/will-broad/scrnaseq_pipeline/archive/multiome_maxcell.zip && unzip multiome_maxcell.zip && cd scrnaseq_pipeline-multiome_maxcell/src && python sc_pipeline.py" \ | ||
--output PIPELINE_LOGS="$gcp_bucket_basedir/logs/execution_$current_time.log" \ | ||
--input SAMPLE_TRACKING_FILE="$sample_tracking_file" \ | ||
--env PROJECT_NAME="$project_name" \ | ||
--env GCP_BUCKET_BASEDIR="$gcp_bucket_basedir" \ | ||
--env EMAIL="$email" \ | ||
--env TERRA_WORKSPACE="$workspace" \ | ||
--env COUNT_MATRIX_NAME="$count_matrix_name" \ | ||
--env STEPS="$steps" \ | ||
--env CELLRANGER_METHOD="$cellranger_method" \ | ||
--env CUMULUS_METHOD="$cumulus_method" \ | ||
--env CELLBENDER_METHOD="$cellbender_method" \ | ||
--env CELLRANGER_VERSION="$cellranger_version" \ | ||
--env CELLRANGER_ATAC_VERSION="$cellranger_atac_version" \ | ||
--env CELLRANGER_ARC_VERSION="$cellranger_arc_version" \ | ||
--env MKFASTQ_DISKSPACE="$mkfastq_diskspace" \ | ||
--env MKFASTQ_MEMORY="$mkfastq_memory" |
Oops, something went wrong.