--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/cubicweb/server/repository.py Sat Jan 16 13:48:51 2016 +0100
@@ -0,0 +1,1133 @@
+# copyright 2003-2014 LOGILAB S.A. (Paris, FRANCE), all rights reserved.
+# contact http://www.logilab.fr/ -- mailto:contact@logilab.fr
+#
+# This file is part of CubicWeb.
+#
+# CubicWeb is free software: you can redistribute it and/or modify it under the
+# terms of the GNU Lesser General Public License as published by the Free
+# Software Foundation, either version 2.1 of the License, or (at your option)
+# any later version.
+#
+# CubicWeb is distributed in the hope that it will be useful, but WITHOUT
+# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
+# FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for more
+# details.
+#
+# You should have received a copy of the GNU Lesser General Public License along
+# with CubicWeb. If not, see <http://www.gnu.org/licenses/>.
+"""Defines the central class for the CubicWeb RQL server: the repository.
+
+The repository is an abstraction allowing execution of rql queries against
+data sources. Most of the work is actually done in helper classes. The
+repository mainly:
+
+* brings these classes all together to provide a single access
+ point to a cubicweb instance.
+* handles session management
+"""
+from __future__ import print_function
+
+__docformat__ = "restructuredtext en"
+
+import threading
+from warnings import warn
+from itertools import chain
+from time import time, localtime, strftime
+from contextlib import contextmanager
+
+from six.moves import range, queue
+
+from logilab.common.decorators import cached, clear_cache
+from logilab.common.deprecation import deprecated
+
+from yams import BadSchemaDefinition
+from rql.utils import rqlvar_maker
+
+from cubicweb import (CW_MIGRATION_MAP, QueryError,
+ UnknownEid, AuthenticationError, ExecutionError,
+ BadConnectionId, ValidationError, Unauthorized,
+ UniqueTogetherError, onevent, ViolatedConstraint)
+from cubicweb import cwvreg, schema, server
+from cubicweb.server import ShuttingDown, utils, hook, querier, sources
+from cubicweb.server.session import Session, InternalManager
+
+NO_CACHE_RELATIONS = set( [('owned_by', 'object'),
+ ('created_by', 'object'),
+ ('cw_source', 'object'),
+ ])
+
+def prefill_entity_caches(entity):
+ cnx = entity._cw
+ # prefill entity relation caches
+ for rschema in entity.e_schema.subject_relations():
+ rtype = str(rschema)
+ if rtype in schema.VIRTUAL_RTYPES or (rtype, 'subject') in NO_CACHE_RELATIONS:
+ continue
+ if rschema.final:
+ entity.cw_attr_cache.setdefault(rtype, None)
+ else:
+ entity.cw_set_relation_cache(rtype, 'subject',
+ cnx.empty_rset())
+ for rschema in entity.e_schema.object_relations():
+ rtype = str(rschema)
+ if rtype in schema.VIRTUAL_RTYPES or (rtype, 'object') in NO_CACHE_RELATIONS:
+ continue
+ entity.cw_set_relation_cache(rtype, 'object', cnx.empty_rset())
+
+def del_existing_rel_if_needed(cnx, eidfrom, rtype, eidto):
+ """delete existing relation when adding a new one if card is 1 or ?
+
+ have to be done once the new relation has been inserted to avoid having
+ an entity without a relation for some time
+
+ this kind of behaviour has to be done in the repository so we don't have
+ hooks order hazardness
+ """
+ # skip that if integrity explicitly disabled
+ if not cnx.is_hook_category_activated('activeintegrity'):
+ return
+ rdef = cnx.rtype_eids_rdef(rtype, eidfrom, eidto)
+ card = rdef.cardinality
+ # one may be tented to check for neweids but this may cause more than one
+ # relation even with '1?' cardinality if thoses relations are added in the
+ # same transaction where the entity is being created. This never occurs from
+ # the web interface but may occurs during test or dbapi connection (though
+ # not expected for this). So: don't do it, we pretend to ensure repository
+ # consistency.
+ #
+ # notes:
+ # * inlined relations will be implicitly deleted for the subject entity
+ # * we don't want read permissions to be applied but we want delete
+ # permission to be checked
+ if card[0] in '1?':
+ with cnx.security_enabled(read=False):
+ cnx.execute('DELETE X %s Y WHERE X eid %%(x)s, '
+ 'NOT Y eid %%(y)s' % rtype,
+ {'x': eidfrom, 'y': eidto})
+ if card[1] in '1?':
+ with cnx.security_enabled(read=False):
+ cnx.execute('DELETE X %s Y WHERE Y eid %%(y)s, '
+ 'NOT X eid %%(x)s' % rtype,
+ {'x': eidfrom, 'y': eidto})
+
+
+def preprocess_inlined_relations(cnx, entity):
+ """when an entity is added, check if it has some inlined relation which
+ requires to be extrated for proper call hooks
+ """
+ relations = []
+ activeintegrity = cnx.is_hook_category_activated('activeintegrity')
+ eschema = entity.e_schema
+ for attr in entity.cw_edited:
+ rschema = eschema.subjrels[attr]
+ if not rschema.final: # inlined relation
+ value = entity.cw_edited[attr]
+ relations.append((attr, value))
+ cnx.update_rel_cache_add(entity.eid, attr, value)
+ rdef = cnx.rtype_eids_rdef(attr, entity.eid, value)
+ if rdef.cardinality[1] in '1?' and activeintegrity:
+ with cnx.security_enabled(read=False):
+ cnx.execute('DELETE X %s Y WHERE Y eid %%(y)s' % attr,
+ {'x': entity.eid, 'y': value})
+ return relations
+
+
+class NullEventBus(object):
+ def publish(self, msg):
+ pass
+
+ def add_subscription(self, topic, callback):
+ pass
+
+ def start(self):
+ pass
+
+ def stop(self):
+ pass
+
+
+class Repository(object):
+ """a repository provides access to a set of persistent storages for
+ entities and relations
+ """
+
+ def __init__(self, config, tasks_manager=None, vreg=None):
+ self.config = config
+ if vreg is None:
+ vreg = cwvreg.CWRegistryStore(config)
+ self.vreg = vreg
+ self._tasks_manager = tasks_manager
+
+ self.app_instances_bus = NullEventBus()
+ self.info('starting repository from %s', self.config.apphome)
+ # dictionary of opened sessions
+ self._sessions = {}
+
+ # list of functions to be called at regular interval
+ # list of running threads
+ self._running_threads = []
+ # initial schema, should be build or replaced latter
+ self.schema = schema.CubicWebSchema(config.appid)
+ self.vreg.schema = self.schema # until actual schema is loaded...
+ # shutdown flag
+ self.shutting_down = False
+ # sources (additional sources info in the system database)
+ self.system_source = self.get_source('native', 'system',
+ config.system_source_config.copy())
+ self.sources_by_uri = {'system': self.system_source}
+ # querier helper, need to be created after sources initialization
+ self.querier = querier.QuerierHelper(self, self.schema)
+ # cache eid -> (type, extid, actual source)
+ self._type_source_cache = {}
+ # cache extid -> eid
+ self._extid_cache = {}
+ # open some connection sets
+ if config.init_cnxset_pool:
+ self.init_cnxset_pool()
+ # the hooks manager
+ self.hm = hook.HooksManager(self.vreg)
+ # registry hook to fix user class on registry reload
+ @onevent('after-registry-reload', self)
+ def fix_user_classes(self):
+ # After registry reload the 'CWUser' class used for CWEtype
+ # changed. So any existing user object have a different class than
+ # the new loaded one. We are hot fixing this.
+ usercls = self.vreg['etypes'].etype_class('CWUser')
+ for session in self._sessions.values():
+ if not isinstance(session.user, InternalManager):
+ session.user.__class__ = usercls
+
+ def init_cnxset_pool(self):
+ """should be called bootstrap_repository, as this is what it does"""
+ config = self.config
+ self._cnxsets_pool = queue.Queue()
+ # 0. init a cnxset that will be used to fetch bootstrap information from
+ # the database
+ self._cnxsets_pool.put_nowait(self.system_source.wrapped_connection())
+ # 1. set used cubes
+ if config.creating or not config.read_instance_schema:
+ config.bootstrap_cubes()
+ else:
+ self.set_schema(self.config.load_bootstrap_schema(), resetvreg=False)
+ config.init_cubes(self.get_cubes())
+ # 2. load schema
+ if config.quick_start:
+ # quick start: only to get a minimal repository to get cubes
+ # information (eg dump/restore/...)
+ #
+ # restrict appobject_path to only load hooks and entity classes in
+ # the registry
+ config.cube_appobject_path = set(('hooks', 'entities'))
+ config.cubicweb_appobject_path = set(('hooks', 'entities'))
+ # limit connections pool to 1
+ config['connections-pool-size'] = 1
+ if config.quick_start or config.creating or not config.read_instance_schema:
+ # load schema from the file system
+ if not config.creating:
+ self.info("set fs instance'schema")
+ self.set_schema(config.load_schema(expand_cubes=True))
+ else:
+ # normal start: load the instance schema from the database
+ self.info('loading schema from the repository')
+ self.set_schema(self.deserialize_schema())
+ # 3. initialize data sources
+ if config.creating:
+ # call init_creating so that for instance native source can
+ # configurate tsearch according to postgres version
+ self.system_source.init_creating()
+ else:
+ self.init_sources_from_database()
+ if 'CWProperty' in self.schema:
+ self.vreg.init_properties(self.properties())
+ # 4. close initialization connection set and reopen fresh ones for
+ # proper initialization
+ self._get_cnxset().close(True)
+ self.cnxsets = [] # list of available cnxsets (can't iterate on a Queue)
+ for i in range(config['connections-pool-size']):
+ self.cnxsets.append(self.system_source.wrapped_connection())
+ self._cnxsets_pool.put_nowait(self.cnxsets[-1])
+
+ # internals ###############################################################
+
+ def init_sources_from_database(self):
+ self.sources_by_eid = {}
+ if self.config.quick_start \
+ or not 'CWSource' in self.schema: # # 3.10 migration
+ self.system_source.init_creating()
+ return
+ with self.internal_cnx() as cnx:
+ # FIXME: sources should be ordered (add_entity priority)
+ for sourceent in cnx.execute(
+ 'Any S, SN, SA, SC WHERE S is_instance_of CWSource, '
+ 'S name SN, S type SA, S config SC').entities():
+ if sourceent.name == 'system':
+ self.system_source.eid = sourceent.eid
+ self.sources_by_eid[sourceent.eid] = self.system_source
+ self.system_source.init(True, sourceent)
+ continue
+ self.add_source(sourceent)
+
+ def _clear_planning_caches(self):
+ clear_cache(self, 'source_defs')
+
+ def add_source(self, sourceent):
+ try:
+ source = self.get_source(sourceent.type, sourceent.name,
+ sourceent.host_config, sourceent.eid)
+ except RuntimeError:
+ if self.config.repairing:
+ self.exception('cant setup source %s, skipped', sourceent.name)
+ return
+ raise
+ self.sources_by_eid[sourceent.eid] = source
+ self.sources_by_uri[sourceent.name] = source
+ if self.config.source_enabled(source):
+ # call source's init method to complete their initialisation if
+ # needed (for instance looking for persistent configuration using an
+ # internal session, which is not possible until connections sets have been
+ # initialized)
+ source.init(True, sourceent)
+ else:
+ source.init(False, sourceent)
+ self._clear_planning_caches()
+
+ def remove_source(self, uri):
+ source = self.sources_by_uri.pop(uri)
+ del self.sources_by_eid[source.eid]
+ self._clear_planning_caches()
+
+ def get_source(self, type, uri, source_config, eid=None):
+ # set uri and type in source config so it's available through
+ # source_defs()
+ source_config['uri'] = uri
+ source_config['type'] = type
+ return sources.get_source(type, source_config, self, eid)
+
+ def set_schema(self, schema, resetvreg=True):
+ self.info('set schema %s %#x', schema.name, id(schema))
+ if resetvreg:
+ # trigger full reload of all appobjects
+ self.vreg.set_schema(schema)
+ else:
+ self.vreg._set_schema(schema)
+ self.querier.set_schema(schema)
+ for source in self.sources_by_uri.values():
+ source.set_schema(schema)
+ self.schema = schema
+
+ def deserialize_schema(self):
+ """load schema from the database"""
+ from cubicweb.server.schemaserial import deserialize_schema
+ appschema = schema.CubicWebSchema(self.config.appid)
+ self.debug('deserializing db schema into %s %#x', appschema.name, id(appschema))
+ with self.internal_cnx() as cnx:
+ try:
+ deserialize_schema(appschema, cnx)
+ except BadSchemaDefinition:
+ raise
+ except Exception as ex:
+ import traceback
+ traceback.print_exc()
+ raise Exception('Is the database initialised ? (cause: %s)' % ex)
+ return appschema
+
+ def _prepare_startup(self):
+ """Prepare "Repository as a server" for startup.
+
+ * trigger server startup hook,
+ * register session clean up task.
+ """
+ if not (self.config.creating or self.config.repairing
+ or self.config.quick_start):
+ # call instance level initialisation hooks
+ self.hm.call_hooks('server_startup', repo=self)
+ # register a task to cleanup expired session
+ self.cleanup_session_time = self.config['cleanup-session-time'] or 60 * 60 * 24
+ assert self.cleanup_session_time > 0
+ cleanup_session_interval = min(60*60, self.cleanup_session_time / 3)
+ assert self._tasks_manager is not None, "This Repository is not intended to be used as a server"
+ self._tasks_manager.add_looping_task(cleanup_session_interval,
+ self.clean_sessions)
+
+ def start_looping_tasks(self):
+ """Actual "Repository as a server" startup.
+
+ * trigger server startup hook,
+ * register session clean up task,
+ * start all tasks.
+
+ XXX Other startup related stuffs are done elsewhere. In Repository
+ XXX __init__ or in external codes (various server managers).
+ """
+ self._prepare_startup()
+ assert self._tasks_manager is not None, "This Repository is not intended to be used as a server"
+ self._tasks_manager.start()
+
+ def looping_task(self, interval, func, *args):
+ """register a function to be called every `interval` seconds.
+
+ looping tasks can only be registered during repository initialization,
+ once done this method will fail.
+ """
+ assert self._tasks_manager is not None, "This Repository is not intended to be used as a server"
+ self._tasks_manager.add_looping_task(interval, func, *args)
+
+ def threaded_task(self, func):
+ """start function in a separated thread"""
+ utils.RepoThread(func, self._running_threads).start()
+
+ #@locked
+ def _get_cnxset(self):
+ try:
+ return self._cnxsets_pool.get(True, timeout=5)
+ except queue.Empty:
+ raise Exception('no connections set available after 5 secs, probably either a '
+ 'bug in code (too many uncommited/rolled back '
+ 'connections) or too much load on the server (in '
+ 'which case you can try to set a bigger '
+ 'connections pool size)')
+
+ def _free_cnxset(self, cnxset):
+ self._cnxsets_pool.put_nowait(cnxset)
+
+ def shutdown(self):
+ """called on server stop event to properly close opened sessions and
+ connections
+ """
+ assert not self.shutting_down, 'already shutting down'
+ if not (self.config.creating or self.config.repairing
+ or self.config.quick_start):
+ # then, the system source is still available
+ self.hm.call_hooks('before_server_shutdown', repo=self)
+ self.shutting_down = True
+ self.system_source.shutdown()
+ if self._tasks_manager is not None:
+ self._tasks_manager.stop()
+ if not (self.config.creating or self.config.repairing
+ or self.config.quick_start):
+ self.hm.call_hooks('server_shutdown', repo=self)
+ for thread in self._running_threads:
+ self.info('waiting thread %s...', thread.getName())
+ thread.join()
+ self.info('thread %s finished', thread.getName())
+ self.close_sessions()
+ while not self._cnxsets_pool.empty():
+ cnxset = self._cnxsets_pool.get_nowait()
+ try:
+ cnxset.close(True)
+ except Exception:
+ self.exception('error while closing %s' % cnxset)
+ continue
+ hits, misses = self.querier.cache_hit, self.querier.cache_miss
+ try:
+ self.info('rql st cache hit/miss: %s/%s (%s%% hits)', hits, misses,
+ (hits * 100) / (hits + misses))
+ hits, misses = self.system_source.cache_hit, self.system_source.cache_miss
+ self.info('sql cache hit/miss: %s/%s (%s%% hits)', hits, misses,
+ (hits * 100) / (hits + misses))
+ nocache = self.system_source.no_cache
+ self.info('sql cache usage: %s/%s (%s%%)', hits+ misses, nocache,
+ ((hits + misses) * 100) / (hits + misses + nocache))
+ except ZeroDivisionError:
+ pass
+
+ def check_auth_info(self, cnx, login, authinfo):
+ """validate authentication, raise AuthenticationError on failure, return
+ associated CWUser's eid on success.
+ """
+ # iter on sources_by_uri then check enabled source since sources doesn't
+ # contain copy based sources
+ for source in self.sources_by_uri.values():
+ if self.config.source_enabled(source) and source.support_entity('CWUser'):
+ try:
+ return source.authenticate(cnx, login, **authinfo)
+ except AuthenticationError:
+ continue
+ else:
+ raise AuthenticationError('authentication failed with all sources')
+
+ def authenticate_user(self, cnx, login, **authinfo):
+ """validate login / password, raise AuthenticationError on failure
+ return associated CWUser instance on success
+ """
+ eid = self.check_auth_info(cnx, login, authinfo)
+ cwuser = self._build_user(cnx, eid)
+ if self.config.consider_user_state and \
+ not cwuser.cw_adapt_to('IWorkflowable').state in cwuser.AUTHENTICABLE_STATES:
+ raise AuthenticationError('user is not in authenticable state')
+ return cwuser
+
+ def _build_user(self, cnx, eid):
+ """return a CWUser entity for user with the given eid"""
+ cls = self.vreg['etypes'].etype_class('CWUser')
+ st = cls.fetch_rqlst(cnx.user, ordermethod=None)
+ st.add_eid_restriction(st.get_variable('X'), 'x', 'Substitute')
+ rset = cnx.execute(st.as_string(), {'x': eid})
+ assert len(rset) == 1, rset
+ cwuser = rset.get_entity(0, 0)
+ # pylint: disable=W0104
+ # prefetch / cache cwuser's groups and properties. This is especially
+ # useful for internal sessions to avoid security insertions
+ cwuser.groups
+ cwuser.properties
+ return cwuser
+
+ # public (dbapi) interface ################################################
+
+ @deprecated("[3.19] use _cw.call_service('repo_stats')")
+ def stats(self): # XXX restrict to managers session?
+ """Return a dictionary containing some statistics about the repository
+ resources usage.
+
+ This is a public method, not requiring a session id.
+
+ This method is deprecated in favor of using _cw.call_service('repo_stats')
+ """
+ with self.internal_cnx() as cnx:
+ return cnx.call_service('repo_stats')
+
+ @deprecated("[3.19] use _cw.call_service('repo_gc_stats')")
+ def gc_stats(self, nmax=20):
+ """Return a dictionary containing some statistics about the repository
+ memory usage.
+
+ This is a public method, not requiring a session id.
+
+ nmax is the max number of (most) referenced object returned as
+ the 'referenced' result
+ """
+ with self.internal_cnx() as cnx:
+ return cnx.call_service('repo_gc_stats', nmax=nmax)
+
+ def get_schema(self):
+ """Return the instance schema.
+
+ This is a public method, not requiring a session id.
+ """
+ return self.schema
+
+ def get_cubes(self):
+ """Return the list of cubes used by this instance.
+
+ This is a public method, not requiring a session id.
+ """
+ versions = self.get_versions(not (self.config.creating
+ or self.config.repairing
+ or self.config.quick_start
+ or self.config.mode == 'test'))
+ cubes = list(versions)
+ cubes.remove('cubicweb')
+ return cubes
+
+ def get_option_value(self, option, foreid=None):
+ """Return the value for `option` in the configuration.
+
+ This is a public method, not requiring a session id.
+
+ `foreid` argument is deprecated and now useless (as of 3.19).
+ """
+ if foreid is not None:
+ warn('[3.19] foreid argument is deprecated', DeprecationWarning,
+ stacklevel=2)
+ # XXX we may want to check we don't give sensible information
+ return self.config[option]
+
+ @cached
+ def get_versions(self, checkversions=False):
+ """Return the a dictionary containing cubes used by this instance
+ as key with their version as value, including cubicweb version.
+
+ This is a public method, not requiring a session id.
+ """
+ from logilab.common.changelog import Version
+ vcconf = {}
+ with self.internal_cnx() as cnx:
+ for pk, version in cnx.execute(
+ 'Any K,V WHERE P is CWProperty, P value V, P pkey K, '
+ 'P pkey ~="system.version.%"', build_descr=False):
+ cube = pk.split('.')[-1]
+ # XXX cubicweb migration
+ if cube in CW_MIGRATION_MAP:
+ cube = CW_MIGRATION_MAP[cube]
+ version = Version(version)
+ vcconf[cube] = version
+ if checkversions:
+ if cube != 'cubicweb':
+ fsversion = self.config.cube_version(cube)
+ else:
+ fsversion = self.config.cubicweb_version()
+ if version < fsversion:
+ msg = ('instance has %s version %s but %s '
+ 'is installed. Run "cubicweb-ctl upgrade".')
+ raise ExecutionError(msg % (cube, version, fsversion))
+ return vcconf
+
+ @cached
+ def source_defs(self):
+ """Return the a dictionary containing source uris as value and a
+ dictionary describing each source as value.
+
+ This is a public method, not requiring a session id.
+ """
+ sources = {}
+ # remove sensitive information
+ for uri, source in self.sources_by_uri.items():
+ sources[uri] = source.public_config
+ return sources
+
+ def properties(self):
+ """Return a result set containing system wide properties.
+
+ This is a public method, not requiring a session id.
+ """
+ with self.internal_cnx() as cnx:
+ # don't use cnx.execute, we don't want rset.req set
+ return self.querier.execute(cnx, 'Any K,V WHERE P is CWProperty,'
+ 'P pkey K, P value V, NOT P for_user U',
+ build_descr=False)
+
+ @deprecated("[3.19] Use session.call_service('register_user') instead'")
+ def register_user(self, login, password, email=None, **kwargs):
+ """check a user with the given login exists, if not create it with the
+ given password. This method is designed to be used for anonymous
+ registration on public web site.
+ """
+ with self.internal_cnx() as cnx:
+ cnx.call_service('register_user', login=login, password=password,
+ email=email, **kwargs)
+ cnx.commit()
+
+ def find_users(self, fetch_attrs, **query_attrs):
+ """yield user attributes for cwusers matching the given query_attrs
+ (the result set cannot survive this method call)
+
+ This can be used by low-privileges account (anonymous comes to
+ mind).
+
+ `fetch_attrs`: tuple of attributes to be fetched
+ `query_attrs`: dict of attr/values to restrict the query
+ """
+ assert query_attrs
+ if not hasattr(self, '_cwuser_attrs'):
+ cwuser = self.schema['CWUser']
+ self._cwuser_attrs = set(str(rschema)
+ for rschema, _eschema in cwuser.attribute_definitions()
+ if not rschema.meta)
+ cwuserattrs = self._cwuser_attrs
+ for k in chain(fetch_attrs, query_attrs):
+ if k not in cwuserattrs:
+ raise Exception('bad input for find_user')
+ with self.internal_cnx() as cnx:
+ varmaker = rqlvar_maker()
+ vars = [(attr, next(varmaker)) for attr in fetch_attrs]
+ rql = 'Any %s WHERE X is CWUser, ' % ','.join(var[1] for var in vars)
+ rql += ','.join('X %s %s' % (var[0], var[1]) for var in vars) + ','
+ rset = cnx.execute(rql + ','.join('X %s %%(%s)s' % (attr, attr)
+ for attr in query_attrs),
+ query_attrs)
+ return rset.rows
+
+ def new_session(self, login, **kwargs):
+ """open a new session for a given user
+
+ raise `AuthenticationError` if the authentication failed
+ raise `ConnectionError` if we can't open a connection
+ """
+ cnxprops = kwargs.pop('cnxprops', None)
+ # use an internal connection
+ with self.internal_cnx() as cnx:
+ # try to get a user object
+ user = self.authenticate_user(cnx, login, **kwargs)
+ session = Session(user, self, cnxprops)
+ user._cw = user.cw_rset.req = session
+ user.cw_clear_relation_cache()
+ self._sessions[session.sessionid] = session
+ self.info('opened session %s for user %s', session.sessionid, login)
+ with session.new_cnx() as cnx:
+ self.hm.call_hooks('session_open', cnx)
+ # commit connection at this point in case write operation has been
+ # done during `session_open` hooks
+ cnx.commit()
+ return session
+
+ def connect(self, login, **kwargs):
+ """open a new session for a given user and return its sessionid """
+ return self.new_session(login, **kwargs).sessionid
+
+ def close(self, sessionid, txid=None, checkshuttingdown=True):
+ """close the session with the given id"""
+ session = self._get_session(sessionid, txid=txid,
+ checkshuttingdown=checkshuttingdown)
+ # operation uncommited before close are rolled back before hook is called
+ with session.new_cnx() as cnx:
+ self.hm.call_hooks('session_close', cnx)
+ # commit connection at this point in case write operation has been
+ # done during `session_close` hooks
+ cnx.commit()
+ session.close()
+ del self._sessions[sessionid]
+ self.info('closed session %s for user %s', sessionid, session.user.login)
+
+ # session handling ########################################################
+
+ def close_sessions(self):
+ """close every opened sessions"""
+ for sessionid in list(self._sessions):
+ try:
+ self.close(sessionid, checkshuttingdown=False)
+ except Exception: # XXX BaseException?
+ self.exception('error while closing session %s' % sessionid)
+
+ def clean_sessions(self):
+ """close sessions not used since an amount of time specified in the
+ configuration
+ """
+ mintime = time() - self.cleanup_session_time
+ self.debug('cleaning session unused since %s',
+ strftime('%H:%M:%S', localtime(mintime)))
+ nbclosed = 0
+ for session in self._sessions.values():
+ if session.timestamp < mintime:
+ self.close(session.sessionid)
+ nbclosed += 1
+ return nbclosed
+
+ @contextmanager
+ def internal_cnx(self):
+ """Context manager returning a Connection using internal user which have
+ every access rights on the repository.
+
+ Beware that unlike the older :meth:`internal_session`, internal
+ connections have all hooks beside security enabled.
+ """
+ with Session(InternalManager(), self) as session:
+ with session.new_cnx() as cnx:
+ cnx.user._cw = cnx # XXX remove when "vreg = user._cw.vreg"
+ # hack in entity.py is gone
+ with cnx.security_enabled(read=False, write=False):
+ yield cnx
+
+ def _get_session(self, sessionid, txid=None, checkshuttingdown=True):
+ """return the session associated with the given session identifier"""
+ if checkshuttingdown and self.shutting_down:
+ raise ShuttingDown('Repository is shutting down')
+ try:
+ session = self._sessions[sessionid]
+ except KeyError:
+ raise BadConnectionId('No such session %s' % sessionid)
+ return session
+
+ # data sources handling ###################################################
+ # * correspondance between eid and (type, source)
+ # * correspondance between eid and local id (i.e. specific to a given source)
+
+ def type_and_source_from_eid(self, eid, cnx):
+ """return a tuple `(type, extid, actual source uri)` for the entity of
+ the given `eid`
+ """
+ try:
+ eid = int(eid)
+ except ValueError:
+ raise UnknownEid(eid)
+ try:
+ return self._type_source_cache[eid]
+ except KeyError:
+ etype, extid, auri = self.system_source.eid_type_source(cnx, eid)
+ self._type_source_cache[eid] = (etype, extid, auri)
+ return etype, extid, auri
+
+ def clear_caches(self, eids):
+ etcache = self._type_source_cache
+ extidcache = self._extid_cache
+ rqlcache = self.querier._rql_cache
+ for eid in eids:
+ try:
+ etype, extid, auri = etcache.pop(int(eid)) # may be a string in some cases
+ rqlcache.pop( ('%s X WHERE X eid %s' % (etype, eid),), None)
+ extidcache.pop(extid, None)
+ except KeyError:
+ etype = None
+ rqlcache.pop( ('Any X WHERE X eid %s' % eid,), None)
+ self.system_source.clear_eid_cache(eid, etype)
+
+ def type_from_eid(self, eid, cnx):
+ """return the type of the entity with id <eid>"""
+ return self.type_and_source_from_eid(eid, cnx)[0]
+
+ def querier_cache_key(self, cnx, rql, args, eidkeys):
+ cachekey = [rql]
+ for key in sorted(eidkeys):
+ try:
+ etype = self.type_from_eid(args[key], cnx)
+ except KeyError:
+ raise QueryError('bad cache key %s (no value)' % key)
+ except TypeError:
+ raise QueryError('bad cache key %s (value: %r)' % (
+ key, args[key]))
+ cachekey.append(etype)
+ # ensure eid is correctly typed in args
+ args[key] = int(args[key])
+ return tuple(cachekey)
+
+ @deprecated('[3.22] use the new store API')
+ def extid2eid(self, source, extid, etype, cnx, insert=True,
+ sourceparams=None):
+ """Return eid from a local id. If the eid is a negative integer, that
+ means the entity is known but has been copied back to the system source
+ hence should be ignored.
+
+ If no record is found, ie the entity is not known yet:
+
+ 1. an eid is attributed
+
+ 2. the source's :meth:`before_entity_insertion` method is called to
+ build the entity instance
+
+ 3. unless source's :attr:`should_call_hooks` tell otherwise,
+ 'before_add_entity' hooks are called
+
+ 4. record is added into the system source
+
+ 5. the source's :meth:`after_entity_insertion` method is called to
+ complete building of the entity instance
+
+ 6. unless source's :attr:`should_call_hooks` tell otherwise,
+ 'before_add_entity' hooks are called
+ """
+ try:
+ return self._extid_cache[extid]
+ except KeyError:
+ pass
+ eid = self.system_source.extid2eid(cnx, extid)
+ if eid is not None:
+ self._extid_cache[extid] = eid
+ self._type_source_cache[eid] = (etype, extid, source.uri)
+ return eid
+ if not insert:
+ return
+ # no link between extid and eid, create one
+ # write query, ensure connection's mode is 'write' so connections
+ # won't be released until commit/rollback
+ try:
+ eid = self.system_source.create_eid(cnx)
+ self._extid_cache[extid] = eid
+ self._type_source_cache[eid] = (etype, extid, source.uri)
+ entity = source.before_entity_insertion(
+ cnx, extid, etype, eid, sourceparams)
+ if source.should_call_hooks:
+ # get back a copy of operation for later restore if
+ # necessary, see below
+ pending_operations = cnx.pending_operations[:]
+ self.hm.call_hooks('before_add_entity', cnx, entity=entity)
+ self.add_info(cnx, entity, source, extid)
+ source.after_entity_insertion(cnx, extid, entity, sourceparams)
+ if source.should_call_hooks:
+ self.hm.call_hooks('after_add_entity', cnx, entity=entity)
+ return eid
+ except Exception:
+ # XXX do some cleanup manually so that the transaction has a
+ # chance to be commited, with simply this entity discarded
+ self._extid_cache.pop(extid, None)
+ self._type_source_cache.pop(eid, None)
+ if 'entity' in locals():
+ hook.CleanupDeletedEidsCacheOp.get_instance(cnx).add_data(entity.eid)
+ self.system_source.delete_info_multi(cnx, [entity])
+ if source.should_call_hooks:
+ cnx.pending_operations = pending_operations
+ raise
+
+ def add_info(self, cnx, entity, source, extid=None):
+ """add type and source info for an eid into the system table,
+ and index the entity with the full text index
+ """
+ # begin by inserting eid/type/source/extid into the entities table
+ hook.CleanupNewEidsCacheOp.get_instance(cnx).add_data(entity.eid)
+ self.system_source.add_info(cnx, entity, source, extid)
+
+ def _delete_cascade_multi(self, cnx, entities):
+ """same as _delete_cascade but accepts a list of entities with
+ the same etype and belonging to the same source.
+ """
+ pendingrtypes = cnx.transaction_data.get('pendingrtypes', ())
+ # delete remaining relations: if user can delete the entity, he can
+ # delete all its relations without security checking
+ with cnx.security_enabled(read=False, write=False):
+ in_eids = ','.join([str(_e.eid) for _e in entities])
+ with cnx.running_hooks_ops():
+ for rschema, _, role in entities[0].e_schema.relation_definitions():
+ if rschema.rule:
+ continue # computed relation
+ rtype = rschema.type
+ if rtype in schema.VIRTUAL_RTYPES or rtype in pendingrtypes:
+ continue
+ if role == 'subject':
+ # don't skip inlined relation so they are regularly
+ # deleted and so hooks are correctly called
+ rql = 'DELETE X %s Y WHERE X eid IN (%s)' % (rtype, in_eids)
+ else:
+ rql = 'DELETE Y %s X WHERE X eid IN (%s)' % (rtype, in_eids)
+ try:
+ cnx.execute(rql, build_descr=False)
+ except ValidationError:
+ raise
+ except Unauthorized:
+ self.exception('Unauthorized exception while cascading delete for entity %s. '
+ 'RQL: %s.\nThis should not happen since security is disabled here.',
+ entities, rql)
+ raise
+ except Exception:
+ if self.config.mode == 'test':
+ raise
+ self.exception('error while cascading delete for entity %s. RQL: %s',
+ entities, rql)
+
+ def init_entity_caches(self, cnx, entity, source):
+ """add entity to connection entities cache and repo's extid cache.
+ Return entity's ext id if the source isn't the system source.
+ """
+ cnx.set_entity_cache(entity)
+ if source.uri == 'system':
+ extid = None
+ else:
+ extid = source.get_extid(entity)
+ self._extid_cache[str(extid)] = entity.eid
+ self._type_source_cache[entity.eid] = (entity.cw_etype, extid, source.uri)
+ return extid
+
+ def glob_add_entity(self, cnx, edited):
+ """add an entity to the repository
+
+ the entity eid should originally be None and a unique eid is assigned to
+ the entity instance
+ """
+ entity = edited.entity
+ entity._cw_is_saved = False # entity has an eid but is not yet saved
+ # init edited_attributes before calling before_add_entity hooks
+ entity.cw_edited = edited
+ source = self.system_source
+ # allocate an eid to the entity before calling hooks
+ entity.eid = self.system_source.create_eid(cnx)
+ # set caches asap
+ extid = self.init_entity_caches(cnx, entity, source)
+ if server.DEBUG & server.DBG_REPO:
+ print('ADD entity', self, entity.cw_etype, entity.eid, edited)
+ prefill_entity_caches(entity)
+ self.hm.call_hooks('before_add_entity', cnx, entity=entity)
+ relations = preprocess_inlined_relations(cnx, entity)
+ edited.set_defaults()
+ if cnx.is_hook_category_activated('integrity'):
+ edited.check(creation=True)
+ self.add_info(cnx, entity, source, extid)
+ try:
+ source.add_entity(cnx, entity)
+ except (UniqueTogetherError, ViolatedConstraint) as exc:
+ userhdlr = cnx.vreg['adapters'].select(
+ 'IUserFriendlyError', cnx, entity=entity, exc=exc)
+ userhdlr.raise_user_exception()
+ edited.saved = entity._cw_is_saved = True
+ # trigger after_add_entity after after_add_relation
+ self.hm.call_hooks('after_add_entity', cnx, entity=entity)
+ # call hooks for inlined relations
+ for attr, value in relations:
+ self.hm.call_hooks('before_add_relation', cnx,
+ eidfrom=entity.eid, rtype=attr, eidto=value)
+ self.hm.call_hooks('after_add_relation', cnx,
+ eidfrom=entity.eid, rtype=attr, eidto=value)
+ return entity.eid
+
+ def glob_update_entity(self, cnx, edited):
+ """replace an entity in the repository
+ the type and the eid of an entity must not be changed
+ """
+ entity = edited.entity
+ if server.DEBUG & server.DBG_REPO:
+ print('UPDATE entity', entity.cw_etype, entity.eid,
+ entity.cw_attr_cache, edited)
+ hm = self.hm
+ eschema = entity.e_schema
+ cnx.set_entity_cache(entity)
+ orig_edited = getattr(entity, 'cw_edited', None)
+ entity.cw_edited = edited
+ source = self.system_source
+ try:
+ only_inline_rels, need_fti_update = True, False
+ relations = []
+ for attr in list(edited):
+ if attr == 'eid':
+ continue
+ rschema = eschema.subjrels[attr]
+ if rschema.final:
+ if getattr(eschema.rdef(attr), 'fulltextindexed', False):
+ need_fti_update = True
+ only_inline_rels = False
+ else:
+ # inlined relation
+ previous_value = entity.related(attr) or None
+ if previous_value is not None:
+ previous_value = previous_value[0][0] # got a result set
+ if previous_value == entity.cw_attr_cache[attr]:
+ previous_value = None
+ else:
+ hm.call_hooks('before_delete_relation', cnx,
+ eidfrom=entity.eid, rtype=attr,
+ eidto=previous_value)
+ relations.append((attr, edited[attr], previous_value))
+ # call hooks for inlined relations
+ for attr, value, _t in relations:
+ hm.call_hooks('before_add_relation', cnx,
+ eidfrom=entity.eid, rtype=attr, eidto=value)
+ if not only_inline_rels:
+ hm.call_hooks('before_update_entity', cnx, entity=entity)
+ if cnx.is_hook_category_activated('integrity'):
+ edited.check()
+ try:
+ source.update_entity(cnx, entity)
+ edited.saved = True
+ except (UniqueTogetherError, ViolatedConstraint) as exc:
+ userhdlr = cnx.vreg['adapters'].select(
+ 'IUserFriendlyError', cnx, entity=entity, exc=exc)
+ userhdlr.raise_user_exception()
+ self.system_source.update_info(cnx, entity, need_fti_update)
+ if not only_inline_rels:
+ hm.call_hooks('after_update_entity', cnx, entity=entity)
+ for attr, value, prevvalue in relations:
+ # if the relation is already cached, update existant cache
+ relcache = entity.cw_relation_cached(attr, 'subject')
+ if prevvalue is not None:
+ hm.call_hooks('after_delete_relation', cnx,
+ eidfrom=entity.eid, rtype=attr, eidto=prevvalue)
+ if relcache is not None:
+ cnx.update_rel_cache_del(entity.eid, attr, prevvalue)
+ del_existing_rel_if_needed(cnx, entity.eid, attr, value)
+ cnx.update_rel_cache_add(entity.eid, attr, value)
+ hm.call_hooks('after_add_relation', cnx,
+ eidfrom=entity.eid, rtype=attr, eidto=value)
+ finally:
+ if orig_edited is not None:
+ entity.cw_edited = orig_edited
+
+
+ def glob_delete_entities(self, cnx, eids):
+ """delete a list of entities and all related entities from the repository"""
+ # mark eids as being deleted in cnx info and setup cache update
+ # operation (register pending eids before actual deletion to avoid
+ # multiple call to glob_delete_entities)
+ op = hook.CleanupDeletedEidsCacheOp.get_instance(cnx)
+ if not isinstance(eids, (set, frozenset)):
+ warn('[3.13] eids should be given as a set', DeprecationWarning,
+ stacklevel=2)
+ eids = frozenset(eids)
+ eids = eids - op._container
+ op._container |= eids
+ data_by_etype = {} # values are [list of entities]
+ #
+ # WARNING: the way this dictionary is populated is heavily optimized
+ # and does not use setdefault on purpose. Unless a new release
+ # of the Python interpreter advertises large perf improvements
+ # in setdefault, this should not be changed without profiling.
+ for eid in eids:
+ etype = self.type_from_eid(eid, cnx)
+ # XXX should cache entity's cw_metainformation
+ entity = cnx.entity_from_eid(eid, etype)
+ try:
+ data_by_etype[etype].append(entity)
+ except KeyError:
+ data_by_etype[etype] = [entity]
+ source = self.system_source
+ for etype, entities in data_by_etype.items():
+ if server.DEBUG & server.DBG_REPO:
+ print('DELETE entities', etype, [entity.eid for entity in entities])
+ self.hm.call_hooks('before_delete_entity', cnx, entities=entities)
+ self._delete_cascade_multi(cnx, entities)
+ source.delete_entities(cnx, entities)
+ source.delete_info_multi(cnx, entities)
+ self.hm.call_hooks('after_delete_entity', cnx, entities=entities)
+ # don't clear cache here, it is done in a hook on commit
+
+ def glob_add_relation(self, cnx, subject, rtype, object):
+ """add a relation to the repository"""
+ self.glob_add_relations(cnx, {rtype: [(subject, object)]})
+
+ def glob_add_relations(self, cnx, relations):
+ """add several relations to the repository
+
+ relations is a dictionary rtype: [(subj_eid, obj_eid), ...]
+ """
+ source = self.system_source
+ relations_by_rtype = {}
+ subjects_by_types = {}
+ objects_by_types = {}
+ activintegrity = cnx.is_hook_category_activated('activeintegrity')
+ for rtype, eids_subj_obj in relations.items():
+ if server.DEBUG & server.DBG_REPO:
+ for subjeid, objeid in eids_subj_obj:
+ print('ADD relation', subjeid, rtype, objeid)
+ for subjeid, objeid in eids_subj_obj:
+ if rtype in relations_by_rtype:
+ relations_by_rtype[rtype].append((subjeid, objeid))
+ else:
+ relations_by_rtype[rtype] = [(subjeid, objeid)]
+ if not activintegrity:
+ continue
+ # take care to relation of cardinality '?1', as all eids will
+ # be inserted later, we've remove duplicated eids since they
+ # won't be caught by `del_existing_rel_if_needed`
+ rdef = cnx.rtype_eids_rdef(rtype, subjeid, objeid)
+ card = rdef.cardinality
+ if card[0] in '?1':
+ with cnx.security_enabled(read=False):
+ cnx.execute('DELETE X %s Y WHERE X eid %%(x)s, '
+ 'NOT Y eid %%(y)s' % rtype,
+ {'x': subjeid, 'y': objeid})
+ subjects = subjects_by_types.setdefault(rdef, {})
+ if subjeid in subjects:
+ del relations_by_rtype[rtype][subjects[subjeid]]
+ subjects[subjeid] = len(relations_by_rtype[rtype]) - 1
+ continue
+ subjects[subjeid] = len(relations_by_rtype[rtype]) - 1
+ if card[1] in '?1':
+ with cnx.security_enabled(read=False):
+ cnx.execute('DELETE X %s Y WHERE Y eid %%(y)s, '
+ 'NOT X eid %%(x)s' % rtype,
+ {'x': subjeid, 'y': objeid})
+ objects = objects_by_types.setdefault(rdef, {})
+ if objeid in objects:
+ del relations_by_rtype[rtype][objects[objeid]]
+ objects[objeid] = len(relations_by_rtype[rtype])
+ continue
+ objects[objeid] = len(relations_by_rtype[rtype])
+ for rtype, source_relations in relations_by_rtype.items():
+ self.hm.call_hooks('before_add_relation', cnx,
+ rtype=rtype, eids_from_to=source_relations)
+ for rtype, source_relations in relations_by_rtype.items():
+ source.add_relations(cnx, rtype, source_relations)
+ rschema = self.schema.rschema(rtype)
+ for subjeid, objeid in source_relations:
+ cnx.update_rel_cache_add(subjeid, rtype, objeid, rschema.symmetric)
+ for rtype, source_relations in relations_by_rtype.items():
+ self.hm.call_hooks('after_add_relation', cnx,
+ rtype=rtype, eids_from_to=source_relations)
+
+ def glob_delete_relation(self, cnx, subject, rtype, object):
+ """delete a relation from the repository"""
+ if server.DEBUG & server.DBG_REPO:
+ print('DELETE relation', subject, rtype, object)
+ source = self.system_source
+ self.hm.call_hooks('before_delete_relation', cnx,
+ eidfrom=subject, rtype=rtype, eidto=object)
+ source.delete_relation(cnx, subject, rtype, object)
+ rschema = self.schema.rschema(rtype)
+ cnx.update_rel_cache_del(subject, rtype, object, rschema.symmetric)
+ self.hm.call_hooks('after_delete_relation', cnx,
+ eidfrom=subject, rtype=rtype, eidto=object)
+
+
+
+
+ # these are overridden by set_log_methods below
+ # only defining here to prevent pylint from complaining
+ info = warning = error = critical = exception = debug = lambda msg, *a, **kw: None
+
+from logging import getLogger
+from cubicweb import set_log_methods
+set_log_methods(Repository, getLogger('cubicweb.repository'))