evolve: comparison hgext3rd/evolve/obscache.py

equal deleted inserted replaced

-:d5de0529a48f
+:f787f5406a98
 return obsstore._all[firstmarker:]
 else:
 obsdata = obsstore.svfs.tryread('obsstore')
 return _readmarkers(obsdata, byteoffset)[1]
-class obscache(object):
-"""cache the "does a rev" is the precursors of some obsmarkers data
+class dualsourcecache(object):
+"""An abstract class for cache that needs both changelog and obsstore
-This is not directly holding the "is this revision obsolete" information,
-because phases data gets into play here. However, it allow to compute the
+This class handles the tracking of changelog and obsstore updates. It provides
-"obsolescence" set without reading the obsstore content.
+data to perform incremental updates (see the '_updatefrom' function for
+details).  This class can also detect stripping of the changelog or the
-Implementation note #1:
+obsstore and can reset the cache in this case (see the 'clear' function
+for details).
-The obsstore is implementing only half of the transaction logic it
-should. It properly record the starting point of the obsstore to allow
-clean rollback. However it still write to the obsstore file directly
-during the transaction. Instead it should be keeping data in memory and
-write to a '.pending' file to make the data vailable for hooks.
-This cache is not going futher than what the obstore is doing, so it does
-not has any '.pending' logic. When the obsstore gains proper '.pending'
-support, adding it to this cache should not be too hard. As the flag
-always move from 0 to 1, we could have a second '.pending' cache file to
-be read. If flag is set in any of them, the value is 1. For the same
-reason, updating the file in place should be possible.
-Implementation note #2:
-Instead of having a large final update run, we could update this cache at
-the level adding a new changeset or a new obsmarkers. More on this in the
-'update code'.
-Implementation note #3:
-Storage-wise, we could have a "start rev" to avoid storing useless
-zero. That would be especially useful for the '.pending' overlay.
 """
-_filepath = 'cache/evoext-obscache-00'
+# default key used for an empty cache
-_headerformat = '>q20sQQ20s'
+#
+# The cache key covering the changesets and obsmarkers content
+#
+# The cache key parts are:
+# - tip-rev,
+# - tip-node,
+# - obsstore-length (nb markers),
+# - obsstore-file-size (in bytes),
+# - obsstore "cache key"
 emptykey = (node.nullrev, node.nullid, 0, 0, node.nullid)
-def __init__(self, repo):
+def __init__(self):
-self._vfs = repo.vfs
-# cache key covering the changesets and obsmarkers content
-#
-# It contains the following data. Combined with 'upgradeneeded' it allows to
-# do iterative upgrade for cache depending of theses two pieces of data.
-#
-# The cache key parts are"
-# - tip-rev,
-# - tip-node,
-# - obsstore-length (nb markers),
-# - obsstore-file-size (in bytes),
-# - obsstore "cache key"
 self._cachekey = None
-self._ondiskkey = None
-self._data = bytearray()
+def _updatefrom(self, repo, revs, obsmarkers):
+"""override this method to update your cache data incrementally
-def get(self, rev):
-"""return True if "rev" is used as "precursors for any obsmarkers
+revs:       list of new revisions in the changelog
+obsmarkers: list of new obsmarkers in the obsstore
-Make sure the cache has been updated to match the repository content before using it"""
+"""
-return self._data[rev]
+raise NotImplementedError
 def clear(self, reset=False):
-"""invalidate the cache content"""
+"""invalidate the cache content
+if 'reset' is passed, we detected a strip and the cache will have to be
+recomputed.
+"""
+# /!\ IMPORTANT /!\
+# You must override this method to actually clear your cache data.
 self._cachekey = self.emptykey if reset else None
-self._data = bytearray()
+# Useful public function (no need to override them)
+def uptodate(self, repo):
+"""return True if the cache content is up to date False otherwise
+This method can be used to detect if the cache is lagging behind new
+data in either changelog or obsstore.
+"""
+if self._cachekey is None:
+self.load(repo)
+status = self._checkkey(repo.changelog, repo.obsstore)
+return (status is not None
+and status[0] == self._cachekey[0] # tiprev
+and status[1] == self._cachekey[3]) # obssize
+def update(self, repo):
+"""update the cache with new repository data
+The update will be incremental when possible"""
+# If we do not have any data, try loading from disk
+if self._cachekey is None:
+self.load(repo)
+assert repo.filtername is None
+cl = repo.changelog
+upgrade = self._upgradeneeded(repo)
+if upgrade is None:
+return
+reset, revs, obsmarkers, obskeypair = upgrade
+if reset or self._cachekey is None:
+self.clear(reset=True)
+self._updatefrom(repo, revs, obsmarkers)
+# update the key from the new data
+key = list(self._cachekey)
+if revs:
+key[0] = len(cl) - 1
+key[1] = cl.node(key[0])
+if obsmarkers:
+key[2] += len(obsmarkers)
+key[3], key[4] = obskeypair
+self._cachekey = tuple(key)
+# from here on, there are internal functions only
 def _checkkey(self, changelog, obsstore):
 """internal function"""
 key = self._cachekey
 if key is None:
 obssize, obskey = obsstore.cachekey(index=keyobssize)
 if obskey != keyobskey:
 return None
 return tiprev, obssize, obskey
-def uptodate(self, repo):
+def _upgradeneeded(self, repo):
-if self._cachekey is None:
-self.load(repo)
-status = self._checkkey(repo.changelog, repo.obsstore)
-return (status is not None
-and status[0] == self._cachekey[0] # tiprev
-and status[1] == self._cachekey[3]) # obssize
-def upgradeneeded(self, repo):
 """return (valid, start-rev, start-obs-idx)
 'valid': is "False" if older cache value needs invalidation,
 'start-rev': first revision not in the cache. None if cache is up to date,
 # requirement (or fix the race, that is not too hard).
 markers = markersfrom(obsstore, keyobssize, keyobslength)
 return reset, revs, markers, (obssize, obskey)
-def update(self, repo):
-"""Iteratively update the cache with new repository data"""
+class obscache(dualsourcecache):
-# If we do not have any data, try loading from disk
+"""cache the "does a rev" is the precursors of some obsmarkers data
-if self._cachekey is None:
-self.load(repo)
+This is not directly holding the "is this revision obsolete" information,
+because phases data gets into play here. However, it allows computing the
-assert repo.filtername is None
+"obsolescence" set without reading the obsstore content.
-cl = repo.changelog
+Implementation note #1:
-upgrade = self.upgradeneeded(repo)
-if upgrade is None:
+The obsstore is implementing only half of the transaction logic it
-return
+should. It properly records the starting point of the obsstore to allow
+clean rollback. However it still writes to the obsstore file directly
-reset, revs, obsmarkers, obskeypair = upgrade
+during the transaction. Instead it should be keeping data in memory and
-if reset or self._cachekey is None:
+write to a '.pending' file to make the data available for hooks.
-self.clear(reset=True)
+This cache is not going further than what the obsstore is doing, so it does
-def _updatefrom(repo, revs, obsmarkers)
+not have any '.pending' logic. When the obsstore gains proper '.pending'
+support, adding it to this cache should not be too hard. As the flag
-# update the key from the new data
+always move from 0 to 1, we could have a second '.pending' cache file to
-key = list(self._cachekey)
+be read. If flag is set in any of them, the value is 1. For the same
-if revs:
+reason, updating the file in place should be possible.
-key[0] = len(cl) - 1
-key[1] = cl.node(key[0])
+Implementation note #2:
-if obsmarkers:
-key[2] += len(obsmarkers)
+Instead of having a large final update run, we could update this cache at
-key[3], key[4] = obskeypair
+the level adding a new changeset or a new obsmarkers. More on this in the
-self._cachekey = tuple(key)
+'update code'.
+Implementation note #3:
+Storage-wise, we could have a "start rev" to avoid storing useless
+zero. That would be especially useful for the '.pending' overlay.
+"""
+_filepath = 'cache/evoext-obscache-00'
+_headerformat = '>q20sQQ20s'
+emptykey = (node.nullrev, node.nullid, 0, 0, node.nullid)
+def __init__(self, repo):
+super(obscache, self).__init__()
+self._ondiskkey = None
+self._vfs = repo.vfs
+self._data = bytearray()
+def get(self, rev):
+"""return True if "rev" is used as "precursors" for any obsmarkers
+Make sure the cache has been updated to match the repository content before using it"""
+return self._data[rev]
+def clear(self, reset=False):
+"""invalidate the cache content"""
+super(obscache, self).clear(reset=reset)
+self._data = bytearray()
 def _updatefrom(self, repo, revs, obsmarkers):
 if revs:
 self._updaterevs(repo, revs)
 if obsmarkers:

changeset 2357	f787f5406a98
parent 2356	d5de0529a48f
child 2359	ff635fa59a25