-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathfind-missing-snps-biobank.sh
executable file
·58 lines (51 loc) · 1.79 KB
/
find-missing-snps-biobank.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
#!/usr/bin/env bash
# Run imputation to find good guesses for the SNPs missing from 23andme.
#
# For every SNP listed in main(), impute2 is run on one interval of the
# matching chromosome, and the output line for that SNP is appended to
# $GEN_FILE.
#
# Inputs, all read from $ALL_1000G_DIR (N is the chromosome number):
#   genetic_map_chr<N>_combined_b37.txt
#   ALL_1000G_phase1integrated_v3_chr<N>_impute.hap.gz
#   ALL_1000G_phase1integrated_v3_chr<N>_impute.legend.gz
#   imputed.chr<N>.gen
# Output:
#   $GEN_FILE, recreated from scratch on every run.
# Exit status:
#   0 when every SNP was written; non-zero when impute2 fails or when at
#   least one SNP could not be found in the impute2 output.
set -euo pipefail

readonly ALL_1000G_DIR=23andme-impute
readonly TMP_DIR=impute-out
readonly GEN_FILE=imputed-snps-biobank.gen
# impute2 output file; overwritten for every SNP.
readonly IMPUTE_OUT="${TMP_DIR}/tmp_impute2"

# Print a message to stderr and abort the script.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

#######################################
# Impute one interval and append the line for a single SNP to $GEN_FILE.
# Globals:   ALL_1000G_DIR, IMPUTE_OUT, GEN_FILE (all read)
# Arguments: $1 - rsid to extract (e.g. rs689)
#            $2 - chromosome number used in the input file names
#            $3 - lower bound passed to impute2 -int
#            $4 - upper bound passed to impute2 -int
# Outputs:   appends to $GEN_FILE; warnings go to stderr
# Returns:   0 if the SNP was found, 1 if not; exits if impute2 fails
#######################################
impute_snp() {
  local rsid=$1 chrom=$2 lower=$3 upper=$4
  local panel="${ALL_1000G_DIR}/ALL_1000G_phase1integrated_v3_chr${chrom}_impute"

  # Drop the previous run's output so an empty run can never be mistaken
  # for this chromosome's result.
  rm -f -- "$IMPUTE_OUT"

  # Explicit check: `set -e` is not honoured inside a function that is
  # called on the left-hand side of `||`, which is how main() calls us.
  impute2 -m "${ALL_1000G_DIR}/genetic_map_chr${chrom}_combined_b37.txt" \
    -h "${panel}.hap.gz" \
    -l "${panel}.legend.gz" \
    -g "${ALL_1000G_DIR}/imputed.chr${chrom}.gen" \
    -int "$lower" "$upper" \
    -Ne 20000 \
    -o "$IMPUTE_OUT" \
    -phase \
    -allow_large_regions \
    || die "impute2 failed for ${rsid} (chr${chrom})"

  # The trailing space keeps e.g. rs689 from also matching rs6890.
  if ! grep -F -- "${rsid} " "$IMPUTE_OUT" >> "$GEN_FILE"; then
    printf 'warning: %s not found in impute2 output for chr%s\n' \
      "$rsid" "$chrom" >&2
    return 1
  fi
}

main() {
  local missing=0

  mkdir -p -- "$TMP_DIR"
  # Start from an empty result file; -f keeps a first run quiet.
  rm -f -- "$GEN_FILE"

  #          rsid        chr  -int lower/upper
  impute_snp rs689       11   0e6  5e6  || missing=1
  impute_snp rs12722495  10   5e6  10e6 || missing=1
  impute_snp rs17574546  15   35e6 40e6 || missing=1
  impute_snp rs4948088   7    50e6 55e6 || missing=1

  return "$missing"
}

main "$@"