File: prepareData.R

package info (click to toggle)
r-bioc-cner 1.26.0%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 18,216 kB
  • sloc: ansic: 23,458; makefile: 6
file content (68 lines) | stat: -rw-r--r-- 3,540 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
library(CNEr)
library(rtracklayer)
library(GenomicRanges)
# Prepare the Axt alignments for the regions of barhl2 and sox14
## hg38 vs danRer10
# Both net.axt files are read in full and then cut down to the danRer10
# window chr6:24000000-27000000; the subsets are written to the home directory.
axtFnHg38DanRer10 <- "/Users/gtan/Repos/github/CNEr/inst/extdata/hg38.danRer10.net.axt"
axtFnDanRer10Hg38 <- "/Users/gtan/Repos/github/CNEr/inst/extdata/danRer10.hg38.net.axt"
axtHg38DanRer10 <- readAxt(axtFnHg38DanRer10)
axtDanRer10Hg38 <- readAxt(axtFnDanRer10Hg38)
# In the hg38.danRer10 alignment the query genome is danRer10, so the size
# passed to subAxt(select="query") must be the length of danRer10 chr6 (not
# hg38 chr6): axt query coordinates on the negative strand are relative to the
# reverse-complemented query chromosome.
qSize <- fetchChromSizes("danRer10")
qSize <- seqlengths(qSize["chr6"])
## subAxt
# danRer10 is the target here, so the window can be selected directly.
danRer10.hg38.net.axt <- subAxt(axtDanRer10Hg38, chr="chr6",
                                start=24000000, end=27000000, select="target")
writeAxt(danRer10.hg38.net.axt, "~/danRer10.hg38.net.axt")
# danRer10 is the query here, so the same window is selected on the query side.
hg38.danRer10.net.axt <- subAxt(axtHg38DanRer10, chr="chr6",
                                start=24000000, end=27000000, select="query",
                                qSize=qSize)
writeAxt(hg38.danRer10.net.axt, "~/hg38.danRer10.net.axt")

# Prepare the filter bed files for the regions of barhl2 and sox14
hg38Filter <- readBed("/Users/gtan/Repos/github/CNEr/inst/extdata/filter_regions.hg38.bed")
danRer10Filter <- readBed("/Users/gtan/Repos/github/CNEr/inst/extdata/filter_regions.danRer10.bed")

## hg38: keep every filter region that overlaps, regardless of strand, the
## merged target ranges of hg38.danRer10 and query ranges of danRer10.hg38
alignedRanges <- reduce(c(targetRanges(hg38.danRer10.net.axt),
                          queryRanges(danRer10.hg38.net.axt)))
hits <- findOverlaps(hg38Filter, alignedRanges, ignore.strand=TRUE)
# A filter region can hit several merged ranges; keep each region only once
hg38Filter <- hg38Filter[unique(queryHits(hits))]

## danRer10: keep the filter regions lying entirely within
## chr6:24000000-27000000
onChr6 <- seqnames(danRer10Filter) == "chr6"
insideWindow <- start(danRer10Filter) >= 24000000 &
  end(danRer10Filter) <= 27000000
danRer10Filter <- danRer10Filter[onChr6 & insideWindow]

## Write both reduced filter sets to the home directory
export.bed(hg38Filter, con="~/filter_regions.hg38.bed")
export.bed(danRer10Filter, con="~/filter_regions.danRer10.bed")

# Prepare the CNE data
# All inputs come from the extdata directory of the installed CNEr package.
extdataDir <- system.file("extdata", package="CNEr")

## Axt alignments, one file per direction
axtFnHg38DanRer10 <- file.path(extdataDir, "hg38.danRer10.net.axt")
axtFnDanRer10Hg38 <- file.path(extdataDir, "danRer10.hg38.net.axt")
axtHg38DanRer10 <- readAxt(axtFnHg38DanRer10)
axtDanRer10Hg38 <- readAxt(axtFnDanRer10Hg38)

## Filter regions for each genome
bedHg38Fn <- file.path(extdataDir, "filter_regions.hg38.bed")
bedDanRer10Fn <- file.path(extdataDir, "filter_regions.danRer10.bed")
bedHg38 <- readBed(bedHg38Fn)
bedDanRer10 <- readBed(bedDanRer10Fn)

## Chromosome sizes for each genome
qSizesHg38 <- fetchChromSizes("hg38")
qSizesDanRer10 <- fetchChromSizes("danRer10")

## Window/identity settings shared by the scans in both directions
scanWindow <- c(50,50,50)
scanIdentity <- c(45, 48, 49)

## hg38 as target, danRer10 as query
CNEHg38DanRer10 <- ceScan(x=axtHg38DanRer10,
                          tFilter=bedHg38, qFilter=bedDanRer10,
                          tSizes=qSizesHg38, qSizes=qSizesDanRer10,
                          window=scanWindow, identity=scanIdentity)
save(CNEHg38DanRer10, file="~/CNEHg38DanRer10.rda")

## danRer10 as target, hg38 as query
CNEDanRer10Hg38 <- ceScan(x=axtDanRer10Hg38,
                          tFilter=bedDanRer10, qFilter=bedHg38,
                          tSizes=qSizesDanRer10, qSizes=qSizesHg38,
                          window=scanWindow, identity=scanIdentity)
save(CNEDanRer10Hg38, file="~/CNEDanRer10Hg38.rda")

## Prepare danRer10CNE.sqlite
library(CNEr)
# Names of the five CNE files expected under ~/Downloads
cneTables <- c("cne2wBf_AstMex102_danRer10_48_50",
               "cne2wBf_cteIde1_danRer10_75_75",
               "cne2wBf_danRer10_hg38_21_30",
               "cne2wBf_danRer10_hg38_45_50",
               "cne2wBf_danRer10_hg38_49_50")
cneFns <- file.path("~/Downloads", cneTables)
# The database file name is relative, so it resolves against the working
# directory; overwrite is left switched off.
dbName <- "danRer10CNE.sqlite"
readAncoraIntoSQLite(cneFns, dbName=dbName, overwrite=FALSE)