veekun_pokedex/pokedex/db/__init__.py

87 lines
3 KiB
Python
Raw Normal View History

# encoding: utf-8
import re
from sqlalchemy import engine_from_config, orm
from ..defaults import get_default_db_uri
from .tables import Language, metadata
from .multilang import MultilangSession, MultilangScopedSession
def connect(uri=None, session_args={}, engine_args={}, engine_prefix=''):
"""Connects to the requested URI. Returns a session object.
With the URI omitted, attempts to connect to a default SQLite database
contained within the package directory.
Calling this function also binds the metadata object to the created engine.
"""
# If we didn't get a uri, fall back to the default
if uri is None:
2011-03-12 14:46:04 +00:00
uri = engine_args.get(engine_prefix + 'url', None)
if uri is None:
uri = get_default_db_uri()
### Do some fixery for MySQL
if uri.startswith('mysql:'):
# MySQL uses latin1 for connections by default even if the server is
# otherwise oozing with utf8; charset fixes this
if 'charset' not in uri:
uri += '?charset=utf8'
# Tables should be InnoDB, in the event that we're creating them, and
# use UTF-8 goddammit!
for table in metadata.tables.values():
table.kwargs['mysql_engine'] = 'InnoDB'
table.kwargs['mysql_charset'] = 'utf8'
### Connect
engine_args[engine_prefix + 'url'] = uri
engine = engine_from_config(engine_args, prefix=engine_prefix)
conn = engine.connect()
metadata.bind = engine
all_session_args = dict(autoflush=True, autocommit=False, bind=engine)
all_session_args.update(session_args)
sm = orm.sessionmaker(class_=MultilangSession, language_class=Language,
**all_session_args)
session = MultilangScopedSession(sm)
2011-04-06 06:34:28 +00:00
# Default to English. Warning, magic constant, messing with internals,
# blah blah. Trying to fetch English here would kinda break on new
# databases. TODO still not an ideal solution, I guess.
session.registry()._default_language_id = 9
return session
def identifier_from_name(name):
"""Make a string safe to use as an identifier.
Valid characters are lowercase alphanumerics and "-". This function may
raise ValueError if it can't come up with a suitable identifier.
This function is useful for scripts which add things with names.
"""
if isinstance(name, str):
identifier = name.decode('utf-8')
else:
identifier = name
identifier = identifier.lower()
identifier = identifier.replace(u'+', u' plus ')
identifier = re.sub(u'[ _]+', u'-', identifier)
identifier = re.sub(u"['./;(),:]", u'', identifier)
identifier = identifier.replace(u'é', u'e')
identifier = identifier.replace(u'', u'-f')
identifier = identifier.replace(u'', u'-m')
if identifier in (u'???', u'????'):
identifier = u'unknown'
elif identifier == u'!':
identifier = u'exclamation'
elif identifier == u'?':
identifier = u'question'
if not identifier.replace(u"-", u"").isalnum():
raise ValueError(identifier)
return identifier