1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127
|
#!/usr/bin/env python
import MySQLdb
import sqlalchemy as sql
from cogent.util.table import Table
from cogent.db.ensembl.species import Species
from cogent.db.ensembl.name import EnsemblDbName
from cogent.db.ensembl.util import asserted_one
__author__ = "Gavin Huttley"
__copyright__ = "Copyright 2007, The Cogent Project"
__credits__ = ["Gavin Huttley"]
__license__ = "GPL"
__version__ = "1.4.1"
__maintainer__ = "Gavin Huttley"
__email__ = "Gavin.Huttley@anu.edu.au"
__status__ = "alpha"
class HostAccount(object):
"""host account data"""
def __init__(self, host, user, passwd, port=None):
super(HostAccount, self).__init__()
self.host = host
self.user = user
self.passwd = passwd
self.port = port or 3306
def __cmp__(self, other):
return cmp((self.host, self.user, self.port),
(other.host, other.user, other.port))
def __str__(self):
return '%s:%s@%s:%s' % (self.user,self.passwd,self.host,self.port)
def get_ensembl_account(release=None):
"""returns an HostAccount for ensembl.
Arguments:
- release: if not specified, returns for the ensembl MySQL server
hosting releases from 48"""
port = [None, 5306][release is None or int(release) > 47]
return HostAccount("ensembldb.ensembl.org", "anonymous", "", port=port)
def _get_default_connection():
return "ensembldb.ensembl.org", "anonymous", ""
class EngineCache(object):
"""storage of active connections, indexed by account, database name"""
_db_account = {}
def __call__(self, account, db_name=None, pool_recycle=None):
"""returns an active SQLAlchemy connection engine"""
assert account and db_name,"Must provide an account and a db"
pool_recycle = pool_recycle or 3600
if account not in self._db_account.get(db_name, []):
if db_name == "PARENT":
engine = MySQLdb.connect(host=account.host, user=account.user,
passwd=account.passwd, port=account.port)
else:
engine = sql.create_engine("mysql://%s/%s" % (account,
db_name), pool_recycle=pool_recycle)
if db_name not in self._db_account:
self._db_account[db_name] = {}
self._db_account[db_name][account] = engine
return self._db_account[db_name][account]
DbConnection = EngineCache()
def make_db_name_pattern(species=None, db_type=None, release=None):
"""returns a pattern for matching the db name against"""
sep = r"%"
pattern = ""
if species:
species = Species.getEnsemblDbPrefix(species)
pattern = "%s%s" % (sep, species)
if db_type:
pattern = "%s%s%s" % (pattern, sep, db_type)
if release:
pattern = "%s%s%s" % (pattern, sep, release)
assert pattern
return "'%s%s'" % (pattern, sep)
def get_db_name(account=None, species=None, db_type=None, release=None,
DEBUG=False):
"""returns the listing of valid data-base names as EnsemblDbName objects"""
if account is None:
account = get_ensembl_account(release=release)
if DEBUG:
print "Connection To:", account
print "Selecting For:", species, db_type, release
server = DbConnection(account, db_name='PARENT')
cursor = server.cursor()
show = "SHOW DATABASES"
if species or db_type or release:
pattern = make_db_name_pattern(species, db_type, release)
show = "%s LIKE %s" % (show, pattern)
if DEBUG:
print show
cursor.execute(show)
rows = cursor.fetchall()
dbs = []
for row in rows:
try:
name = EnsemblDbName(row[0])
if (release is None or name.Release == str(release)) and\
(db_type is None or name.Type == db_type):
dbs.append(name)
except (IndexError, RuntimeError):
if DEBUG:
print "FAIL:", row[0]
continue
return dbs
def get_latest_release(account = None):
"""returns the number of the latest release based on the compara db"""
names = get_db_name(account=account, db_type="compara")
compara = []
for name in names:
compara += [int(name.Release)]
return str(max(compara))
if __name__ == "__main__":
eaccount = get_ensembl_account(release='48')
print get_db_name(account=eaccount, release="48", db_type='compara')
print get_latest_release()
|