File: supportedGeneIDs.R

package info (click to toggle)
r-bioc-genelendatabase 1.26.0-1
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 103,600 kB
  • sloc: makefile: 2
file content (27 lines) | stat: -rw-r--r-- 1,208 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
supportedGeneIDs=function(){
	base=unfactor(GenomicFeatures:::supportedUCSCtables())

	#Current version
	txname2gene_mapinfo=GenomicFeatures:::.UCSC_TXNAME2GENEID_MAPDEFS
	base$GeneID=""

	#Old version
	#tmp=unlist(lapply(txname2gene_mapinfo[base$db],function(u){u[[2]]}))
	#base$GeneID[match(names(tmp),base$db)]=as.character(tmp)

	#NEW Ant 28/09/16
	tmp=unlist(lapply(txname2gene_mapinfo[base$tablename],function(u){u[[2]]}))
	base$GeneID[match(names(tmp),base$tablename)]=as.character(tmp)

	#Add in gene symbol
	base[nrow(base)+1,]=c("geneSymbol",'refGene','refFlat',"Gene Symbol")
	base$AvailableGenomes=""
	repo=grep(".*\\..*\\.LENGTH",as.data.frame(data(package="geneLenDataBase")$results,stringsAsFactors=FALSE)$Item,ignore.case=TRUE,value=TRUE)
	repo=matrix(unlist(strsplit(repo,"\\.")),ncol=3,byrow=TRUE)
	valid_genomes=sapply(split(repo[,1],repo[,2]),paste,collapse=",")
	valid_genomes=valid_genomes[which(names(valid_genomes)%in%base$tablename)]
	base$AvailableGenomes[match(names(valid_genomes),base$tablename)]=as.character(valid_genomes)
  
  avail = base[base$tablename == "knownGene" | base$tablename == "vegaGene" | base$tablename == "geneSymbol" | base$tablename == "ensGene",]
  avail
}