Skip to content

Commit

Permalink
use mosue data instead
Browse files Browse the repository at this point in the history
  • Loading branch information
Moustafa Shokrof committed Jul 14, 2022
1 parent 4534341 commit 2e4ab3e
Show file tree
Hide file tree
Showing 3 changed files with 126 additions and 22 deletions.
59 changes: 56 additions & 3 deletions usecases/kDifferentialExpression/downloadData.sh
Original file line number Diff line number Diff line change
@@ -1,5 +1,58 @@
mkdir -p inputData
cd inputData
wget http://genomedata.org/rnaseq-tutorial/HBR_UHR_ERCC_ds_5pc.tar
tar -xvf HBR_UHR_ERCC_ds_5pc.tar
wget http://genomedata.org/rnaseq-tutorial/fasta/GRCh38/chr22_with_ERCC92.fa
#!/usr/bin/env bash
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252175/DRR252175_1.fastq.gz -o DRR252175_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253462_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252175/DRR252175_2.fastq.gz -o DRR252175_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253462_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252176/DRR252176_1.fastq.gz -o DRR252176_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253463_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252176/DRR252176_2.fastq.gz -o DRR252176_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253463_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252174/DRR252174_1.fastq.gz -o DRR252174_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253461_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252174/DRR252174_2.fastq.gz -o DRR252174_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253461_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252177/DRR252177_1.fastq.gz -o DRR252177_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253464_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252177/DRR252177_2.fastq.gz -o DRR252177_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253464_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252178/DRR252178_1.fastq.gz -o DRR252178_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253465_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252178/DRR252178_2.fastq.gz -o DRR252178_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253465_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252179/DRR252179_1.fastq.gz -o DRR252179_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253466_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252179/DRR252179_2.fastq.gz -o DRR252179_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253466_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252181/DRR252181_1.fastq.gz -o DRR252181_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253468_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252181/DRR252181_2.fastq.gz -o DRR252181_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253468_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252183/DRR252183_1.fastq.gz -o DRR252183_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253470_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252183/DRR252183_2.fastq.gz -o DRR252183_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253470_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252180/DRR252180_1.fastq.gz -o DRR252180_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253467_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252180/DRR252180_2.fastq.gz -o DRR252180_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253467_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252182/DRR252182_1.fastq.gz -o DRR252182_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253469_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252182/DRR252182_2.fastq.gz -o DRR252182_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253469_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252184/DRR252184_1.fastq.gz -o DRR252184_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253471_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252184/DRR252184_2.fastq.gz -o DRR252184_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253471_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252185/DRR252185_1.fastq.gz -o DRR252185_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253472_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252185/DRR252185_2.fastq.gz -o DRR252185_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253472_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252187/DRR252187_1.fastq.gz -o DRR252187_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253474_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252187/DRR252187_2.fastq.gz -o DRR252187_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253474_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252188/DRR252188_1.fastq.gz -o DRR252188_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253475_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252188/DRR252188_2.fastq.gz -o DRR252188_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253475_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252190/DRR252190_1.fastq.gz -o DRR252190_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253477_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252190/DRR252190_2.fastq.gz -o DRR252190_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253477_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252191/DRR252191_1.fastq.gz -o DRR252191_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253478_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252191/DRR252191_2.fastq.gz -o DRR252191_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253478_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252186/DRR252186_1.fastq.gz -o DRR252186_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253473_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252186/DRR252186_2.fastq.gz -o DRR252186_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253473_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252189/DRR252189_1.fastq.gz -o DRR252189_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253476_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252189/DRR252189_2.fastq.gz -o DRR252189_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253476_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252192/DRR252192_1.fastq.gz -o DRR252192_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253479_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252192/DRR252192_2.fastq.gz -o DRR252192_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253479_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252193/DRR252193_1.fastq.gz -o DRR252193_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253480_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252193/DRR252193_2.fastq.gz -o DRR252193_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253480_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252194/DRR252194_1.fastq.gz -o DRR252194_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253481_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252194/DRR252194_2.fastq.gz -o DRR252194_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253481_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252195/DRR252195_1.fastq.gz -o DRR252195_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253482_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252195/DRR252195_2.fastq.gz -o DRR252195_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253482_2.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252196/DRR252196_1.fastq.gz -o DRR252196_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253483_1.fastq.gz
curl -L ftp://ftp.sra.ebi.ac.uk/vol1/fastq/DRR252/DRR252196/DRR252196_2.fastq.gz -o DRR252196_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253483_2.fastq.gz


#wget https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/001/635/GCF_000001635.27_GRCm39/GCF_000001635.27_GRCm39_genomic.fna.gz

wget https://hgdownload.soe.ucsc.edu/goldenPath/mm39/bigZips/mrna.fa.gz

gzip -d mrna.fa.gz

#wget http://genomedata.org/rnaseq-tutorial/fasta/GRCh38/chr22_with_ERCC92.fa
29 changes: 23 additions & 6 deletions usecases/kDifferentialExpression/sample_table.csv
Original file line number Diff line number Diff line change
@@ -1,8 +1,25 @@
sample_name,library
ERCC92,transpictome
HBR_REP1,sample
HBR_REP2,sample
HBR_REP3,sample
UHR_REP1,control
UHR_REP2,control
UHR_REP3,control
SAMD00253483,control
SAMD00253482,control
SAMD00253481,control
SAMD00253480,control
SAMD00253479,control
SAMD00253478,control
SAMD00253477,control
SAMD00253476,control
SAMD00253475,control
SAMD00253474,control
SAMD00253473,control
SAMD00253472,control
SAMD00253471,sample
SAMD00253470,sample
SAMD00253469,sample
SAMD00253468,sample
SAMD00253467,sample
SAMD00253466,sample
SAMD00253465,sample
SAMD00253464,sample
SAMD00253463,sample
SAMD00253462,sample
SAMD00253461,sample
60 changes: 47 additions & 13 deletions usecases/kDifferentialExpression/subsample_table.csv
Original file line number Diff line number Diff line change
@@ -1,14 +1,48 @@
sample_name,file
ERCC92,inputData/genesERCC.fa
HBR_REP1,inputData/HBR_Rep1_ERCC-Mix2_Build37-ErccTranscripts-chr22.read1.fastq.gz
HBR_REP1,inputData/HBR_Rep1_ERCC-Mix2_Build37-ErccTranscripts-chr22.read2.fastq.gz
HBR_REP2,inputData/HBR_Rep2_ERCC-Mix2_Build37-ErccTranscripts-chr22.read1.fastq.gz
HBR_REP2,inputData/HBR_Rep2_ERCC-Mix2_Build37-ErccTranscripts-chr22.read2.fastq.gz
HBR_REP3,inputData/HBR_Rep3_ERCC-Mix2_Build37-ErccTranscripts-chr22.read1.fastq.gz
HBR_REP3,inputData/HBR_Rep3_ERCC-Mix2_Build37-ErccTranscripts-chr22.read2.fastq.gz
UHR_REP1,inputData/UHR_Rep1_ERCC-Mix1_Build37-ErccTranscripts-chr22.read1.fastq.gz
UHR_REP1,inputData/UHR_Rep1_ERCC-Mix1_Build37-ErccTranscripts-chr22.read2.fastq.gz
UHR_REP2,inputData/UHR_Rep2_ERCC-Mix1_Build37-ErccTranscripts-chr22.read1.fastq.gz
UHR_REP2,inputData/UHR_Rep2_ERCC-Mix1_Build37-ErccTranscripts-chr22.read2.fastq.gz
UHR_REP3,inputData/UHR_Rep3_ERCC-Mix1_Build37-ErccTranscripts-chr22.read1.fastq.gz
UHR_REP3,inputData/UHR_Rep3_ERCC-Mix1_Build37-ErccTranscripts-chr22.read2.fastq.gz
ERCC92,inputData/mrna.
SAMD00253461,inputData/DRR252174_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253461_1.fastq.gz
SAMD00253468,inputData/DRR252181_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253468_1.fastq.gz
SAMD00253462,inputData/DRR252175_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253462_1.fastq.gz
SAMD00253477,inputData/DRR252190_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253477_2.fastq.gz
SAMD00253464,inputData/DRR252177_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253464_1.fastq.gz
SAMD00253472,inputData/DRR252185_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253472_1.fastq.gz
SAMD00253471,inputData/DRR252184_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253471_1.fastq.gz
SAMD00253467,inputData/DRR252180_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253467_1.fastq.gz
SAMD00253478,inputData/DRR252191_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253478_2.fastq.gz
SAMD00253482,inputData/DRR252195_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253482_1.fastq.gz
SAMD00253474,inputData/DRR252187_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253474_1.fastq.gz
SAMD00253481,inputData/DRR252194_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253481_1.fastq.gz
SAMD00253480,inputData/DRR252193_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253480_2.fastq.gz
SAMD00253475,inputData/DRR252188_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253475_2.fastq.gz
SAMD00253476,inputData/DRR252189_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253476_2.fastq.gz
SAMD00253483,inputData/DRR252196_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253483_2.fastq.gz
SAMD00253479,inputData/DRR252192_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253479_1.fastq.gz
SAMD00253470,inputData/DRR252183_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253470_2.fastq.gz
SAMD00253473,inputData/DRR252186_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253473_2.fastq.gz
SAMD00253466,inputData/DRR252179_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253466_2.fastq.gz
SAMD00253465,inputData/DRR252178_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253465_2.fastq.gz
SAMD00253463,inputData/DRR252176_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253463_2.fastq.gz
SAMD00253469,inputData/DRR252182_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253469_2.fastq.gz
SAMD00253469,inputData/DRR252182_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253469_1.fastq.gz
SAMD00253463,inputData/DRR252176_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253463_1.fastq.gz
SAMD00253466,inputData/DRR252179_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253466_1.fastq.gz
SAMD00253465,inputData/DRR252178_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253465_1.fastq.gz
SAMD00253470,inputData/DRR252183_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253470_1.fastq.gz
SAMD00253473,inputData/DRR252186_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253473_1.fastq.gz
SAMD00253480,inputData/DRR252193_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253480_1.fastq.gz
SAMD00253475,inputData/DRR252188_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253475_1.fastq.gz
SAMD00253483,inputData/DRR252196_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253483_1.fastq.gz
SAMD00253479,inputData/DRR252192_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253479_2.fastq.gz
SAMD00253476,inputData/DRR252189_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253476_1.fastq.gz
SAMD00253474,inputData/DRR252187_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253474_2.fastq.gz
SAMD00253478,inputData/DRR252191_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253478_1.fastq.gz
SAMD00253482,inputData/DRR252195_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253482_2.fastq.gz
SAMD00253481,inputData/DRR252194_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253481_2.fastq.gz
SAMD00253472,inputData/DRR252185_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253472_2.fastq.gz
SAMD00253467,inputData/DRR252180_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253467_2.fastq.gz
SAMD00253471,inputData/DRR252184_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253471_2.fastq.gz
SAMD00253477,inputData/DRR252190_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253477_1.fastq.gz
SAMD00253464,inputData/DRR252177_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253464_2.fastq.gz
SAMD00253461,inputData/DRR252174_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253461_2.fastq.gz
SAMD00253462,inputData/DRR252175_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253462_2.fastq.gz
SAMD00253468,inputData/DRR252181_Illumina_HiSeq_2500_paired_end_sequencing_of_SAMD00253468_2.fastq.gz

0 comments on commit 2e4ab3e

Please sign in to comment.