-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfind_mito.R
34 lines (27 loc) · 1.07 KB
/
find_mito.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
library(tidyverse)
library(Biostrings)
library(RColorBrewer)
library(BSgenome)
library(GenomicRanges)
source('prolificans_asm_functions.R')
datadir='/pym/Data/Nanopore/projects/prolificans'
dbxdir='~/Dropbox/timplab_data/prolificans'
strains=c('st31', 'st90853', 'st5317')
teloinfofile=file.path(dbxdir, 'telo_info.csv')
alltelos=read_csv(teloinfofile, col_types=cols())
##trim mitos
for (i in strains) {
genomedir=file.path(datadir, i, 'genomes_covfilt')
prefixes=sub('\\.covfilt.fasta$', '', list.files(genomedir, '.covfilt.fasta$'))
newgenomedir=file.path(datadir, i, 'genomes_mitotrim')
system(paste0('mkdir -p ', newgenomedir))
for (asmname in prefixes) {
coordsfile=file.path(datadir, i, 'mummer_mito', paste0(asmname, '.mcoords'))
asmtiginfo=alltelos %>%
filter(asm==asmname)
asmfile=file.path(genomedir, paste0(asmname, '.covfilt.fasta'))
outfile=file.path(newgenomedir, paste0(asmname, '.mitotrim.fasta'))
print(asmname)
suggest_mito_breaks(coordsfile, asmtiginfo, asmfile, outfile)
}
}