-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathfosmids.R
82 lines (63 loc) · 2.91 KB
/
fosmids.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#!/usr/bin/env Rscript
setwd(dirname(rstudioapi::getActiveDocumentContext()$path))
#source("plotutils.R")
tested_sds = readbed("data/misc_files/probe.mappings.bed.gz", "sds")
probe = c("174222_ABC10_2_1_000044559800_C15","174222_ABC10_2_1_000044587300_G6","171417_ABC10_2_1_000045520200_K20")
#tested_sds=tested_sds[probe_id %in% probe]
n =length(unique(tested_sds$probe_id))
#
# read in fes results
#
results = fread("data/misc_files/results.csv.gz")
results = melt(results, id.vars =c("sample", "CLONES"))
results$loc = gsub("\\(het\\)", "", results$value)
results$chr = results$variable
results= results[!is.na(results$loc)]
results=results[loc !="" ]
results
cens = CYTO[CYTO$gieStain == "gpos100"]
pcen = resize(cens, 5000000, fix="end")
qcen = resize(cens, 5000000, fix="start")
a = DataFrame(chr = as.character(seqnames(pcen)), start = start(ranges(pcen)), end = end(ranges(pcen)) ); a$loc = "pcen"
b = DataFrame(chr = as.character(seqnames(qcen)), start = start(ranges(qcen)), end = end(ranges(qcen)) ); b$loc = "qcen"
c = DataFrame(chr = FAI$chr, start = FAI$chrlen-5000000, end = FAI$chrlen); c$loc = "qter"
d = DataFrame(chr = as.character(seqnames(qcen)), start = 0, end = 5000000); d$loc = "pter"
e = DataFrame(chr=("chr4"), start = c(75300001), end = c(87100000), loc = "q21")
f = DataFrame(chr = as.character(seqnames(qcen)), start = start(ranges(qcen)), end = end(ranges(qcen)) ); f$loc = "qpcen"
convert_results = as.data.table(rbind(a,b,c,d,e,f))
fish_results = merge(results, convert_results, by = c("chr", "loc"))
fish_results= fish_results[chr %in% NOM]
fish_results <- as.data.table(merge(as.data.frame(fish_results),
data.table(color=brewer.pal(length(unique(fish_results$sample)), "Set3"),
sample = unique(fish_results$sample))))
gr_fish = toGRanges(data.table(fish_results$chr, fish_results$start, fish_results$end))
#
# show only the tested probes
#
all = tested_sds[tested_sds$probe_id %in% fish_results$CLONES]
probe = unique(all$probe_id)
n=length(probe)
#
# plot results
#
myplots <- vector('list', n)
for(i in seq(n)){
df <- all[probe_id==probe[i]]
df2 <- fish_results[CLONES==probe[i]]
chromosomes <- CHRS[ CHRS %in% df$chr | CHRS %in% df2$chr ]
#df <- df[df$end-df$start > 9999]
myplots[[i]] = as.ggplot(expression(
kp <- plotKaryotype(genome = GENOME, cytobands = CYTO, chromosomes = chromosomes, plot.type = 2),
kpAddMainTitle(kp, main=probe[i]),
kpPlotRegions(kp, data = reduce(toGRanges(data.table(chr = as.character(df$chr), start = df$start, end=df$end))+1000000),
col = NEWCOLOR),
kpPlotRegions(kp, data = toGRanges(data.table(chr = as.character(df2$chr), start = df2$start, end=df2$end))+5000000,
col = df2$color, border = df2$color, data.panel = 2)
))
}
myplots[[1]]
pdf("~/Desktop/fosmid.pdf", height = 4, width = 16)
for(i in seq(n)){
print(myplots[[i]])
}
dev.off()