1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66
|
\name{readGEOAnn}
\alias{readGEOAnn}
\alias{readIDNAcc}
\alias{getGPLNames}
\alias{getSAGEFileInfo}
\alias{getSAGEGPL}
\alias{readUrl}
\title{Function to extract data from the GEO web site}
\description{
Data files that are available at GEO web site are identified by GEO
accession numbers. Given the url for the CGI script at GEO and
a GEO accession number, the functions extract data from the web site
and returns a matrix containing the data.
}
\usage{
readGEOAnn(GEOAccNum, url = "https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?")
readIDNAcc(GEOAccNum, url = "https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?")
getGPLNames(url ="https://www.ncbi.nlm.nih.gov/geo/query/browse.cgi?")
getSAGEFileInfo(url =
"https://www.ncbi.nlm.nih.gov/geo/query/browse.cgi?view=platforms&prtype=SAGE&dtype=SAGE")
getSAGEGPL(organism = "Homo sapiens", enzyme = c("NlaIII", "Sau3A"))
readUrl(url)
}
\arguments{
\item{url}{\code{url} the url for the CGI script at GEO}
\item{GEOAccNum}{\code{GEOAccNum} a character string for the GEO
accession number of a desired file (e. g. GPL97)}
\item{organism}{\code{organism} a character string for the name of the
organism of interests}
\item{enzyme}{\code{enzyme} a character string that can be eighter
NlaII or Sau3A for the enzyme used to create SAGE tags}
}
\details{
\code{url} is the CGI script that processes user's
request. \code{\link{readGEOAnn}} invokes the CGI by passing a GEO
accession number and then processes the data file obtained.
\code{\link{readIDNAcc}} calls \code{\link{readGEOAnn}} to read the
data and the extracts the columns for probe ids and accession numbers.
The \code{GEOAccNum} has to be the id for an Affymetrix chip.
\code{\link{getGPLNames}} parses the html file that lists GEO
accession numbers and descriptions of the array represented by the
corresponding GEO accession numbers.
}
\value{
Both \code{\link{readGEOAnn}} and \code{\link{readIDNAcc}} return a
matrix.
\code{\link{getGPLNames}} returns a named vector of the names of
commercial arrays. The names of the vector are the corresponding GEO
accession number.
}
\references{\url{www.ncbi.nlm.nih.gov/geo}}
\author{Jianhua Zhang}
\examples{
# Get array names and GEO accession numbers
#geoAccNums <- getGPLNames()
# Read the annotation data file for HG-U133A which is GPL96 based on
# examining geoAccNums
#temp <- readGEOAnn(GEOAccNum = "GPL96")
#temp2 <- readIDNAcc(GEOAccNum = "GPL96")
}
\keyword{manip}
|