mercurial-scm/hg-stable: tests/artifacts/scripts/generate-churning-bundle.py comparison

comparison tests/artifacts/scripts/generate-churning-bundle.py @ 52469:9feb175c028d

test-sparse-revlog: build the content directly in memory. We now do our own merge, so both the graph and the content are fully defined, which will help to speed up the generation soon. The generation jumps through a few hoops to avoid consuming 700MB of memory at run time.

author	Pierre-Yves David <pierre-yves.david@octobus.net>
date	Wed, 04 Dec 2024 10:34:17 +0100
parents	e26b738430a1
children	83f87912c5e0

comparison

equal deleted inserted replaced

-:e26b738430a1
+:9feb175c028d
 else:
 to_write = oldcontent[idx]
 yield to_write
def merge_content(base, left, right):
    """Merge two versions of a file content to produce a new one.

    The three inputs are walked in lockstep, one line at a time. A line that
    changed on one side only takes that side's version; a line that differs
    from the base on both sides gets a brand new value. Similar to what the
    manifest would do.

    base:  lines of the common ancestor
    left:  lines of the first parent
    right: lines of the second parent

    Yield the merged lines one by one. As with `zip`, iteration stops at the
    end of the shortest input.
    """
    # Use distinct loop names: reusing `left`/`right` here would rebind the
    # parameters while they are being iterated.
    for old, ours, theirs in zip(base, left, right):
        if old == ours:
            # Left side untouched, take the right side. This also covers the
            # "nothing changed" case, where `theirs` is equal to `old`.
            yield theirs
        elif old == theirs:
            # Only the left side changed.
            yield ours
        else:
            # Both sides differ from the base: generate fresh content.
            yield nextcontent(ours + theirs)
def ancestors(graph, rev):
    """Return the set of ancestors of revision <rev>, <rev> itself included.

    <graph> maps each revision to an iterable of its parents; a `None` entry
    stands for a missing parent and is ignored.
    """
    seen = {rev}
    pending = [rev]
    while pending:
        current = pending.pop()
        for parent in graph[current]:
            if parent is None or parent in seen:
                continue
            # Mark as seen when queueing so that a revision reachable through
            # several paths is only walked once.
            seen.add(parent)
            pending.append(parent)
    return seen
def gca(graph, left, right):
    """Find the greatest common ancestor of <left> and <right>.

    The result is the highest revision number present in the ancestors of
    both revisions.
    NOTE(review): this presumably relies on parents always having a lower
    revision number than their children -- confirm against how the graph is
    built.

    Note that the algorithm is naive and N² when run on all merges; however,
    this should not be too much of an issue given the current scale.

    Raise ValueError if the two revisions share no ancestor.
    """
    common = ancestors(graph, left) & ancestors(graph, right)
    if not common:
        # A bare max() on an empty set would only report "max() arg is an
        # empty sequence"; say what actually went wrong instead.
        raise ValueError(
            "revisions %r and %r have no common ancestor" % (left, right)
        )
    return max(common)
def make_one_content_fn(idx, base, left, right):
    """Build a function that builds the content of revision <idx> on demand.

    <base>, <left> and <right> are content functions (as returned by this
    factory) for the merge base, the first parent and the second parent, or
    None when there is no such revision:

    - <left> is None: no parent, the content is generated from scratch;
    - <base> is None: single parent, the content is derived from <left>;
    - otherwise: the two parents are merged, then the result is updated.

    The dependencies are kept as references to make sure they are not
    garbage-collected until we use them. Once the current content has been
    computed, we drop those references to allow them to be garbage collected.

    Return a zero-argument function. Its first call computes the content as a
    list of lines; later calls return that same cached list.
    """
    # The closure below only references `pending` and `value`, so the
    # dependencies are reachable through `pending` alone: emptying it is
    # enough to release them.
    pending = [(idx, base, left, right)]
    value = None

    def final_fn():
        nonlocal value
        if value is None:
            rev, base_fn, left_fn, right_fn = pending[0]
            if left_fn is None:
                new = filecontent(rev, None)
            elif base_fn is None:
                new = filecontent(rev, left_fn())
            else:
                merged = merge_content(base_fn(), left_fn(), right_fn())
                # materialise the lazy merge before handing it over
                new = filecontent(rev, list(merged))
            value = list(new)
            # Release the dependencies only once the content exists, so a
            # failed generation can still be retried.
            pending.clear()
        return value

    return final_fn
def build_content_graph(graph):
    """Produce the file content for all revisions.

    <graph> maps each revision to its `(p1, p2)` pair of parents, `None`
    standing for a missing parent. Parents must come before their children
    when iterating over <graph>, since each revision looks up the entries
    already created for its parents.

    Return a dictionary mapping each revision to a function producing its
    content. The content is generated on demand and cached. Clean up the
    dictionary as you use it to reduce memory usage.
    """
    content = {}
    for idx, (p1, p2) in graph.items():
        base = left = right = None
        if p1 is not None:
            left = content[p1]
            if p2 is not None:
                # Merge: the content also depends on the second parent and
                # on the common ancestor used as merge base.
                right = content[p2]
                base_rev = gca(graph, p1, p2)
                base = content[base_rev]
        content[idx] = make_one_content_fn(idx, base, left, right)
    return content
# Content generator for every revision of GRAPH, keyed by revision. Entries
# are meant to be popped as they are consumed, so that the cached content can
# eventually be garbage collected.
CONTENT = build_content_graph(GRAPH)
 def hg(command, *args):
 """call a mercurial command with appropriate config and argument"""
 env = os.environ.copy()
 print("generating commit #%d/%d" % (idx, NB_CHANGESET))
 if p1 is not None and p1 != idx - 1:
 hg('update', "%d" % p1)
 if p2 is not None:
 hg('merge', "%d" % p2)
-updatefile(FILENAME, idx)
+with open(FILENAME, 'wb') as f:
+# pop the value to let it be garbage collection eventually.
+for line in CONTENT.pop(idx)():
+f.write(line)
 if idx == 0:
 hg('add', FILENAME)
 hg('commit', '--addremove', '--message', 'initial commit')
 else:
 hg('commit', '--message', 'commit #%d' % idx)

Mercurial > public > mercurial-scm > hg-stable

comparison tests/artifacts/scripts/generate-churning-bundle.py @ 52469:9feb175c028d