mercurial-scm/hg: mercurial/revlogutils/deltas.py comparison

comparison mercurial/revlogutils/deltas.py @ 41109:3e1960e23e6b

delta: reuse _findsnapshots call from previous stage Two different stages of the sparse-revlog logic need the _findsnapshots data. To avoid computing it twice, make it possible to reuse the result of the first computation in the second stage. example affected manifest write before: 0.067141s after: 0.064252s (-5%) (total gain since start of series: 95%)

author	Boris Feld <boris.feld@octobus.net>
date	Thu, 20 Dec 2018 10:16:24 +0100
parents	38e88450138c
children	189e06b2d719

comparison

equal deleted inserted replaced

-:38e88450138c
+:3e1960e23e6b
 # build delta will reuse the cache
 good = yield (cachedelta[0],)
 if good is not None:
 yield None
 return
-for candidates in _rawgroups(revlog, p1, p2, cachedelta):
+snapshots = collections.defaultdict(list)
+for candidates in _rawgroups(revlog, p1, p2, cachedelta, snapshots):
 good = yield candidates
 if good is not None:
 break
 # If sparse revlog is enabled, we can try to refine the available deltas
 base = revlog.deltaparent(good)
 if base == nullrev:
 break
 good = yield (base,)
 # refine snapshot up
-#
+if not snapshots:
-# XXX the _findsnapshots call can be expensive and is "duplicated" with
+_findsnapshots(revlog, snapshots, good + 1)
-# the one done in `_rawgroups`. Once we start working on performance,
-# we should make the two logics share this computation.
-snapshots = collections.defaultdict(list)
-_findsnapshots(revlog, snapshots, good + 1)
 previous = None
 while good != previous:
 previous = good
 children = tuple(sorted(c for c in snapshots[good]))
 good = yield children
 # we have found nothing
 yield None
-def _rawgroups(revlog, p1, p2, cachedelta):
+def _rawgroups(revlog, p1, p2, cachedelta, snapshots=None):
 """Provides group of revision to be tested as delta base
 This lower level function focus on emitting delta theorically interresting
 without looking it any practical details.
 elif len(parents) > 0:
 # Test all parents (1 or 2), and keep the best candidate
 yield parents
 if sparse and parents:
-snapshots = collections.defaultdict(list) # map: base-rev: snapshot-rev
+if snapshots is None:
+# map: base-rev: snapshot-rev
+snapshots = collections.defaultdict(list)
 # See if we can use an existing snapshot in the parent chains to use as
 # a base for a new intermediate-snapshot
 #
 # search for snapshot in parents delta chain
 # map: snapshot-level: snapshot-rev

Mercurial > public > mercurial-scm > hg

comparison mercurial/revlogutils/deltas.py @ 41109:3e1960e23e6b