DESCRIPTION | 13 +++++
NAMESPACE | 14 ++++++
R/zzz.R | 37 ++++++++++++++
debian/README.test | 5 --
debian/changelog | 13 -----
debian/compat | 1 -
debian/control | 25 ---------
debian/copyright | 134 -------------------------------------------------
debian/rules | 4 --
debian/source/format | 1 -
debian/watch | 3 --
inst/extdata/GO.sqlite | Bin 0 -> 97032192 bytes
man/GOBASE.Rd | 35 +++++++++++++
man/GOBPANCESTOR.Rd | 54 ++++++++++++++++++++
man/GOBPCHILDREN.Rd | 61 ++++++++++++++++++++++
man/GOBPOFFSPRING.Rd | 55 ++++++++++++++++++++
man/GOBPPARENTS.Rd | 66 ++++++++++++++++++++++++
man/GOCCANCESTOR.Rd | 54 ++++++++++++++++++++
man/GOCCCHILDREN.Rd | 60 ++++++++++++++++++++++
man/GOCCOFFSPRING.Rd | 54 ++++++++++++++++++++
man/GOCCPARENTS.Rd | 64 +++++++++++++++++++++++
man/GOMAPCOUNTS.Rd | 51 +++++++++++++++++++
man/GOMFANCESTOR.Rd | 55 ++++++++++++++++++++
man/GOMFCHILDREN.Rd | 60 ++++++++++++++++++++++
man/GOMFOFFSPRING.Rd | 54 ++++++++++++++++++++
man/GOMFPARENTS.Rd | 66 ++++++++++++++++++++++++
man/GOOBSOLETE.Rd | 44 ++++++++++++++++
man/GOSYNONYM.Rd | 34 +++++++++++++
man/GOTERM.Rd | 60 ++++++++++++++++++++++
man/GO_dbconn.Rd | 87 ++++++++++++++++++++++++++++++++
30 files changed, 1078 insertions(+), 186 deletions(-)
--- /dev/null
@@ -0,0 +1,13 @@
+Package: GO.db
+Title: A set of annotation maps describing the entire Gene Ontology
+Description: A set of annotation maps describing the entire Gene Ontology assembled using data from GO
+Version: 3.4.0
+Author: Marc Carlson
+Maintainer: Bioconductor Package Maintainer <maintainer at bioconductor.org>
+Depends: R (>= 2.7.0), methods, AnnotationDbi (>= 1.35.4)
+Imports: methods, AnnotationDbi
+Suggests: DBI
+License: Artistic-2.0
+biocViews: AnnotationData, FunctionalAnnotation
+NeedsCompilation: no
+Packaged: 2016-10-02 21:51:35 UTC; root
--- /dev/null
@@ -0,0 +1,14 @@
+### Only put what is statically exported here. All the AnnObj instances
+### created at load time are dynamically exported (refer to R/zzz.R for
+### the details).
+ GO,
+ GO_dbconn,
+ GO_dbfile,
+ GO_dbschema,
+ GO_dbInfo
@@ -0,0 +1,37 @@
+datacache <- new.env(hash=TRUE, parent=emptyenv())
+GO <- function() showQCData("GO", datacache)
+GO_dbconn <- function() dbconn(datacache)
+GO_dbfile <- function() dbfile(datacache)
+GO_dbschema <- function(file="", show.indices=FALSE) dbschema(datacache, file=file, show.indices=show.indices)
+GO_dbInfo <- function() dbInfo(datacache)
+.onLoad <- function(libname, pkgname)
+ ## Connect to the SQLite DB
+ dbfile <- system.file("extdata", "GO.sqlite", package=pkgname, lib.loc=libname)
+ assign("dbfile", dbfile, envir=datacache)
+ dbconn <- dbFileConnect(dbfile)
+ assign("dbconn", dbconn, envir=datacache)
+ ## Create the OrgDb object
+ sPkgname <- sub(".db$","",pkgname)
+ txdb <- loadDb(system.file("extdata", paste(sPkgname,
+ ".sqlite",sep=""), package=pkgname, lib.loc=libname),
+ packageName=pkgname)
+ dbNewname <- AnnotationDbi:::dbObjectName(pkgname,"GODb")
+ ns <- asNamespace(pkgname)
+ assign(dbNewname, txdb, envir=ns)
+ namespaceExport(ns, dbNewname)
+ ## Create the AnnObj instances
+ ann_objs <- createAnnObjs.SchemaChoice("GO_DB", "GO", "GO", dbconn, datacache)
+ mergeToNamespaceAndExport(ann_objs, pkgname)
+ packageStartupMessage(AnnotationDbi:::annoStartupMessages("GO.db"))
+.onUnload <- function(libpath)
+ dbFileDisconnect(GO_dbconn())
@@ -1,5 +0,0 @@
-Notes on how this package can be tested.
-This package can be tested by loading it into R with the command
-‘library(GO.db)’ in order to confirm its integrity.
deleted file mode 100644
index ec63514..0000000
--- a/debian/compat
+++ /dev/null
@@ -1 +0,0 @@
diff --git a/debian/control b/debian/control
deleted file mode 100644
index 2269755..0000000
--- a/debian/control
+++ /dev/null
@@ -1,25 +0,0 @@
-Source: r-bioc-go.db
-Maintainer: Debian Med Packaging Team <debian-med-packaging at lists.alioth.debian.org>
-Uploaders: Andreas Tille <tille at debian.org>
-Section: gnu-r
-Priority: optional
-Build-Depends: debhelper (>= 9),
- dh-r,
- r-base-dev,
- r-bioc-annotationdbi
-Standards-Version: 3.9.8
-Vcs-Browser: https://anonscm.debian.org/viewvc/debian-med/trunk/packages/R/r-bioc-go.db/trunk/
-Vcs-Svn: svn://anonscm.debian.org/debian-med/trunk/packages/R/r-bioc-go.db/trunk/
-Homepage: https://bioconductor.org/packages/GO.db/
-Package: r-bioc-go.db
-Architecture: all
-Depends: ${R:Depends},
- ${misc:Depends}
-Recommends: ${R:Recommends}
-Suggests: ${R:Suggests}
-Description: annotation maps describing the entire Gene Ontology
- This package is part of BioConductor and provides a set of annotation
- maps describing the entire Gene Ontology assembled using data from GO.
- .
- The package helps running the test suites of some BioConductor packages.
@@ -0,0 +1,35 @@
+\title{Bioconductor annotation data package}
+ Welcome to the GO.db annotation Package. The purpose of this
+ package is to provide detailed information about the latest version of the
+ Gene Ontologies. This package is updated biannually.
+ Objects in this package are accessed using the \code{select()} interface.
+ See ?select in the AnnotationDbi package for details.
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ \code{keys()}, \code{columns()} and \code{select()}.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+## The 'old style' of interacting with these objects is manipulation as
+## bimaps. While this approach is still available we strongly encourage the
+## use of select().
@@ -0,0 +1,54 @@
+\title{Annotation of GO Identifiers to their Biological Process Ancestors}
+ This data set describes associations between GO Biological Process (BP)
+ terms and their ancestor BP terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO BP terms to all ancestor terms, where an
+ ancestor term is a more general GO term that precedes
+ the given GO term in the DAG (in other words, the parents, and all
+ their parents, etc.).
+ Each GO BP term is mapped to a vector of ancestor GO BP terms.
+ Biological process is defined as the broad biological goals, such as
+ mitosis or purine metabolism, that are accomplished by ordered
+ assemblies of molecular functions as defined by Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOBPANCESTOR)
+# Remove GO IDs that do not have any ancestor
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the ancestor GO IDs for the first two elements of xx
+ goids <- xx[1:2]
@@ -0,0 +1,61 @@
+\title{Annotation of GO Identifiers to their Biological Process Children}
+This data set describes associations between GO biological process (BP)
+ terms and their direct children BP terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO BP terms to all direct children terms, where a
+ direct child term is a more specific GO term that is immediately preceded
+ by the given GO term in the DAG.
+ Each GO BP term is mapped to a vector of children GO BP terms.
+ Biological process is defined as the broad biological goals, such as
+ mitosis or purine metabolism, that are accomplished by ordered
+ assemblies of molecular functions as defined by Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOBPCHILDREN)
+# Remove GO IDs that do not have any children
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the children GO IDs for the first element of xx
+ goids <- xx[[1]]
+ # Find out the GO terms for the first child goid
+ GOID(GOTERM[[goids[1]]])
+ Term(GOTERM[[goids[1]]])
+ Synonym(GOTERM[[goids[1]]])
+ Secondary(GOTERM[[goids[1]]])
+ Definition(GOTERM[[goids[1]]])
+ Ontology(GOTERM[[goids[1]]])
@@ -0,0 +1,55 @@
+\title{Annotation of GO Identifiers to their Biological Process Offspring}
+ This data set describes associations between GO biological process (BP)
+ terms and their offspring BP terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO BP terms to all offspring terms, where an
+ offspring term is a more specific GO term that is preceded
+ by the given GO term in the DAG (in other words, the children and all
+ their children, etc.).
+ Each GO BP term is mapped to a vector of offspring GO BP terms.
+ Biological process is defined as the broad biological goals, such as
+ mitosis or purine metabolism, that are accomplished by ordered
+ assemblies of molecular functions as defined by Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOBPOFFSPRING)
+# Remove GO IDs that do not have any offspring
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the offspring GO IDs for the first two elements of xx
+ goids <- xx[1:2]
@@ -0,0 +1,66 @@
+\title{Annotation of GO Identifiers to their Biological Process Parents}
+ This data set describes associations between GO biological process (BP)
+ terms and their direct parent BP terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO BP terms to all direct parent terms, where a
+ direct parent term is a more general GO term that immediately precedes
+ the given GO term in the DAG.
+ Each GO BP term is mapped to a named vector of GO BP terms. The name
+ associated with the parent term will be either \emph{isa}, \emph{hasa} or \emph{partof},
+ where \emph{isa} indicates that the child term is a more specific version
+ of the parent, and \emph{hasa} and \emph{partof} indicate that the
+ child term is a part of the parent. For example, a telomere is part of
+ a chromosome.
+ Biological process is defined as the broad biological goals, such as
+ mitosis or purine metabolism, that are accomplished by ordered
+ assemblies of molecular functions as defined by Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOBPPARENTS)
+# Remove GO IDs that do not have any parent
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the parent GO IDs for the first element of xx
+ goids <- xx[[1]]
+ # Find out the GO terms for the first parent goid
+ GOID(GOTERM[[goids[1]]])
+ Term(GOTERM[[goids[1]]])
+ Synonym(GOTERM[[goids[1]]])
+ Secondary(GOTERM[[goids[1]]])
+ Definition(GOTERM[[goids[1]]])
+ Ontology(GOTERM[[goids[1]]])
@@ -0,0 +1,54 @@
+\title{Annotation of GO Identifiers to their Cellular Component Ancestors}
+ This data set describes associations between GO cellular component (CC)
+ terms and their ancestor CC terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO CC terms to all ancestor terms, where an
+ ancestor term is a more general GO term that precedes
+ the given GO term in the DAG (in other words, the parents, and all
+ their parents, etc.).
+ Each GO CC term is mapped to a vector of ancestor GO CC terms.
+ Cellular component is defined as the subcellular structures,
+ locations, and macromolecular complexes; examples include nucleus,
+ telomere, and origin recognition complex as defined by Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOCCANCESTOR)
+# Remove GO IDs that do not have any ancestor
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the ancestor GO IDs for the first two elements of xx
+ goids <- xx[1:2]
@@ -0,0 +1,60 @@
+\title{Annotation of GO Identifiers to their Cellular Component Children}
+ This data set describes associations between GO cellular component (CC)
+ terms and their direct children CC terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO CC terms to all direct children terms, where a
+ direct child term is a more specific GO term that is immediately preceded
+ by the given GO term in the DAG.
+ Each GO CC term is mapped to a vector of children GO CC terms.
+ Cellular component is defined as the subcellular structures,
+ locations, and macromolecular complexes; examples include nucleus,
+ telomere, and origin recognition complex as defined by Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOCCCHILDREN)
+# Remove GO IDs that do not have any children
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+goids <- xx[[1]]
+# Find out the GO terms for the first child goid
@@ -0,0 +1,54 @@
+\title{Annotation of GO Identifiers to their Cellular Component Offspring}
+ This data set describes associations between GO cellular component (CC)
+ terms and their offspring CC terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO CC terms to all offspring terms, where an
+ offspring term is a more specific GO term that is preceded
+ by the given GO term in the DAG (in other words, the children and all
+ their children, etc.).
+ Each GO CC term is mapped to a vector of offspring GO CC terms.
+ Cellular component is defined as the subcellular structures,
+ locations, and macromolecular complexes; examples include nucleus,
+ telomere, and origin recognition complex as defined by the Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOCCOFFSPRING)
+# Remove GO identifiers that do not have any offspring
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the offspring GO identifiers for the first two elements of xx
+ goidentifiers <- xx[1:2]
@@ -0,0 +1,64 @@
+\title{Annotation of GO Identifiers to their Cellular Component Parents}
+ This data set describes associations between GO cellular component (CC)
+ terms and their direct parent CC terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO CC terms to all direct parent terms, where a
+ direct parent term is a more general GO term that immediately precedes
+ the given GO term in the DAG.
+ Each GO CC term is mapped to a named vector of GO CC terms. The name
+ associated with the parent term will be either \emph{isa}, \emph{hasa} or \emph{partof},
+ where \emph{isa} indicates that the child term is a more specific version
+ of the parent, and \emph{hasa} and \emph{partof} indicate that the
+ child term is a part of the parent. For example, a telomere is part of
+ a chromosome.
+ Cellular component is defined as the subcellular structures,
+ locations, and macromolecular complexes; examples include nucleus,
+ telomere, and origin recognition complex as defined by the Gene Ontology
+ Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOCCPARENTS)
+# Remove GO IDs that do not have any parent
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ goids <- xx[[1]]
+ # Find out the GO terms for the first parent go ID
+ GOID(GOTERM[[goids[1]]])
+ Term(GOTERM[[goids[1]]])
+ Synonym(GOTERM[[goids[1]]])
+ Secondary(GOTERM[[goids[1]]])
+ Definition(GOTERM[[goids[1]]])
+ Ontology(GOTERM[[goids[1]]])
@@ -0,0 +1,51 @@
+\title{Number of mapped keys for the maps in package GO.db}
+ GOMAPCOUNTS provides the "map count" (i.e. the
+ count of mapped keys) for each map in package GO.db.
+ This "map count" information is precalculated and stored in the
+ package annotation DB. This allows some quality control and is used by
+ the \code{\link[AnnotationDbi:AnnDbPkg-checker]{checkMAPCOUNTS}}
+ function defined in AnnotationDbi to compare and validate different
+ methods (like \code{count.mappedkeys(x)} or
+ \code{sum(!is.na(as.list(x)))}) for getting the "map count" of a given
+ map.
+ \itemize{
+ \item \code{\link[AnnotationDbi:Bimap-keys]{mappedkeys}},
+ \item \code{\link[AnnotationDbi:Bimap-keys]{count.mappedkeys}},
+ \item \code{\link[AnnotationDbi:AnnDbPkg-checker]{checkMAPCOUNTS}}
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+mapnames <- names(GOMAPCOUNTS)
+x <- get(mapnames[1])
+count.mappedkeys(x) # much faster!
+## Check the "map count" of all the maps in package GO.db
@@ -0,0 +1,55 @@
+\title{Annotation of GO identifiers to their Molecular Function Ancestors}
+ This data set describes associations between GO molecular function (MF)
+ terms and their ancestor MF terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO MF terms to all ancestor terms, where an
+ ancestor term is a more general GO term that precedes
+ the given GO term in the DAG (in other words, the parents, and all
+ their parents, etc.).
+ Each GO MF term is mapped to a vector of ancestor GO MF terms.
+ Molecular function is defined as the tasks performed by individual
+ gene products; examples are transcription factor and DNA helicase as
+ defined by Gene Ontology Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOMFANCESTOR)
+# Remove GO identifiers that do not have any ancestor
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the ancestor GO identifiers for the first two elements of xx
+ goids <- xx[1:2]
@@ -0,0 +1,60 @@
+\title{Annotation of GO Identifiers to their Molecular Function Children}
+ This data set describes associations between GO molecular function (MF)
+ terms and their direct children MF terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO MF terms to all direct children terms, where a
+ direct child term is a more specific GO term that is immediately preceded
+ by the given GO term in the DAG.
+ Each GO MF term is mapped to a vector of children GO MF terms.
+ Molecular function is defined as the tasks performed by individual
+ gene products; examples are transcription factor and DNA helicase as
+ defined by Gene Ontology Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOMFCHILDREN)
+# Remove GO identifiers that do not have any children
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the children GO identifiers for the first element of xx
+ goids <- xx[[1]]
+ # Find out the GO terms for the first child goid
+ GOID(GOTERM[[goids[1]]])
+ Term(GOTERM[[goids[1]]])
+ Synonym(GOTERM[[goids[1]]])
+ Secondary(GOTERM[[goids[1]]])
+ Definition(GOTERM[[goids[1]]])
+ Ontology(GOTERM[[goids[1]]])
@@ -0,0 +1,54 @@
+\title{Annotation of GO Identifiers to their Molecular Function Offspring}
+ This data set describes associations between GO molecular function (MF)
+ terms and their offspring MF terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO MF terms to all offspring terms, where an
+ offspring term is a more specific GO term that is preceded
+ by the given GO term in the DAG (in other words, the children and all
+ their children, etc.).
+ Each GO MF term is mapped to a vector of offspring GO MF terms.
+ Molecular function is defined as the tasks performed by individual
+ gene products; examples are transcription factor and DNA helicase as
+ defined by Gene Ontology Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+\url{http://www.geneontology.org/} and
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOMFOFFSPRING)
+# Remove GO identifiers that do not have any offspring
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the offspring GO identifiers for the first two elements of xx
+goids <- xx[1:2]
@@ -0,0 +1,66 @@
+\title{Annotation of GO Identifiers to their Molecular Function Parents}
+ This data set describes associations between GO molecular function (MF)
+ terms and their direct parent MF terms, based on the directed acyclic
+ graph (DAG) defined by the Gene Ontology Consortium. The format is an R
+ object mapping the GO MF terms to all direct parent terms, where a
+ direct parent term is a more general GO term that immediately precedes
+ the given GO term in the DAG.
+ Each GO MF term is mapped to a named vector of GO MF terms. The name
+ associated with the parent term will be either \emph{isa}, \emph{hasa} or \emph{partof},
+ where \emph{isa} indicates that the child term is a more specific version
+ of the parent, and \emph{hasa} and \emph{partof} indicate that the
+ child term is a part of the parent. For example, a telomere is part of
+ a chromosome.
+ Molecular function is defined as the tasks performed by individual
+ gene products; examples are transcription factor and DNA helicase as
+ defined by the Gene Ontology Consortium.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+ \url{http://www.geneontology.org/} and
+ \url{https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?db=gene}
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOMFPARENTS)
+# Remove GO identifiers that do not have any parent
+xx <- xx[!is.na(xx)]
+if(length(xx) > 0){
+ # Get the parent GO identifiers for the first element of xx
+ goids <- xx[[1]]
+ # Find out the GO terms for the first parent goid
+ GOID(GOTERM[[goids[1]]])
+ Term(GOTERM[[goids[1]]])
+ Synonym(GOTERM[[goids[1]]])
+ Secondary(GOTERM[[goids[1]]])
+ Definition(GOTERM[[goids[1]]])
+ Ontology(GOTERM[[goids[1]]])
@@ -0,0 +1,44 @@
+\title{Annotation of GO identifiers to terms defined by the Gene Ontology
+ Consortium whose status is obsolete}
+This is an R object mapping GO identifiers to the specific
+terms defined by the Gene Ontology Consortium whose definitions are obsolete.
+ All the obsolete GO terms that are collected in this index will no longer exist
+ in other mapping objects.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+ \url{https://www.ncbi.nlm.nih.gov/LocusLink}
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOTERM)
+if(length(xx) > 0){
+ # Get the TERMS for the first element of xx
+ GOID(xx[[1]])
+ Ontology(xx[[1]])
diff --git a/man/GOSYNONYM.Rd b/man/GOSYNONYM.Rd
@@ -0,0 +1,34 @@
+\title{Map from GO synonyms to GO terms}
+ GOSYNONYM is an R object that provides mapping
+ from GO synonyms to GO terms
+ [TODO: Put some details here]
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+sample(x, 3)
+# GO ID "GO:0009435" has a lot of synonyms
+# GO ID "GO:0006736" is a synonym of GO ID "GO:0009435"
@@ -0,0 +1,60 @@
+\title{Annotation of GO Identifiers to GO Terms}
+ This data set gives mappings between GO identifiers and their respective terms.
+ Each GO identifier is mapped to a \code{GOTerms} object that has 6 slots:
+ GOID: GO Identifier
+ Term: The term for that GO id
+ Synonym: Synonymous terms
+ Secondary: Secondary terms that have been merged into this term
+ Definition: Further definition of the GO term
+ Ontology: One of MF - molecular function, BP - biological
+ process, or CC - cellular component
+ All the obsolete GO terms are under the nodes "obsolete molecular
+ function" (GO:0008369), "obsolete cellular component"
+ (GO:0008370), and "obsolete biological process" (GO:0008371). Each of
+ these GO identifiers has a group of GO identifiers as their direct children with GO
+ terms that were defined by GO but are
+ deprecated in the current build. These deprecated GO terms were
+ appended by "(obsolete)" when the data package was built.
+ Mappings were based on data provided by: Gene Ontology
+ ftp://ftp.geneontology.org/pub/go/godatabase/archive/latest-lite/
+ With a date stamp from the source of: 2016-Sep21
+ \url{https://www.ncbi.nlm.nih.gov/entrez/query.fcgi?db=gene}
+ \itemize{
+ \item \code{\link[AnnotationDbi]{AnnotationDb-class}} for use of
+ the \code{select()} interface.
+ }
+## select() interface:
+## Objects in this package can be accessed using the select() interface
+## from the AnnotationDbi package. See ?select for details.
+## Bimap interface:
+# Convert the object to a list
+xx <- as.list(GOTERM)
+if(length(xx) > 0){
+ # Get the TERMS for the first element of xx
+ GOID(xx[[1]])
+ Term(xx[[1]])
+ Synonym(xx[[1]])
+ Secondary(xx[[1]])
+ Definition(xx[[1]])
+ Ontology(xx[[1]])
@@ -0,0 +1,87 @@
+\title{Collect information about the package annotation DB}
+ Some convenience functions for getting a connection object to (or collecting
+ information about) the package annotation DB.
+ GO_dbconn()
+ GO_dbfile()
+ GO_dbschema(file="", show.indices=FALSE)
+ GO_dbInfo()
+ \item{file}{
+ A connection, or a character string naming the file to print to (see
+ the \code{file} argument of the \code{\link[base]{cat}} function for
+ the details).
+ }
+ \item{show.indices}{
+ The CREATE INDEX statements are not shown by default.
+ Use \code{show.indices=TRUE} to get them.
+ }
+ \code{GO_dbconn} returns a connection object to the
+ package annotation DB. IMPORTANT: Don't call
+ \code{\link[DBI:dbConnect]{dbDisconnect}} on the connection object
+ returned by \code{GO_dbconn} or you will break all the
+ \code{\link[AnnotationDbi:AnnDbObj-class]{AnnDbObj}} objects defined
+ in this package!
+ \code{GO_dbfile} returns the path (character string) to the
+ package annotation DB (this is an SQLite file).
+ \code{GO_dbschema} prints the schema definition of the
+ package annotation DB.
+ \code{GO_dbInfo} prints other information about the package
+ annotation DB.
+ \code{GO_dbconn}: a DBIConnection object representing an
+ open connection to the package annotation DB.
+ \code{GO_dbfile}: a character string with the path to the
+ package annotation DB.
+ \code{GO_dbschema}: none (invisible \code{NULL}).
+ \code{GO_dbInfo}: none (invisible \code{NULL}).
+ \code{\link[DBI:dbSendQuery]{dbGetQuery}},
+ \code{\link[DBI:dbConnect]{dbConnect}},
+ \code{\link[AnnotationDbi:AnnDbObj-class]{dbconn}},
+ \code{\link[AnnotationDbi:AnnDbObj-class]{dbfile}},
+ \code{\link[AnnotationDbi:AnnDbObj-class]{dbschema}},
+ \code{\link[AnnotationDbi:AnnDbObj-class]{dbInfo}}
+ library(DBI)
+ ## Count the number of rows in the "go_term" table:
+ dbGetQuery(GO_dbconn(), "SELECT COUNT(*) FROM go_term")
+ GO_dbschema()
+ GO_dbInfo()
