mercurial-scm/hg: mercurial/cmdutil.py comparison

comparison mercurial/cmdutil.py @ 9925:9dfe34bf42c7

findrenames: first loop over the removed files, it's faster. Getting the file from the working dir is less expensive than getting it from the repo history, hence the speedup. Benchmarked on the crew repo with: rm -rf * ; hg up -C ; for i in `find . -name "*.py"` ; do mv $i $i.new;done -- followed by: hg addremove -s 100. Before: Time: real 68.760 secs (user 65.760+0.000 sys 2.490+0.000). After: Time: real 28.890 secs (user 26.920+0.000 sys 1.450+0.000).

author	Benoit Boissinot <benoit.boissinot@ens-lyon.org>
date	Tue, 24 Nov 2009 17:26:42 +0100
parents	2c2f7593ffc4
children	4b044b81cb54

comparison

equal deleted inserted replaced

-:3d718761157b
+:9dfe34bf42c7
 def matchfiles(repo, files):
 return _match.exact(repo.root, repo.getcwd(), files)
 def findrenames(repo, added, removed, threshold):
 '''find renamed files -- yields (before, after, score) tuples'''
+copies = {}
 ctx = repo['.']
-for a in added:
+for r in removed:
-aa = repo.wread(a)
+if r not in ctx:
-bestname, bestscore = None, threshold
+continue
-for r in removed:
+fctx = ctx.filectx(r)
-if r not in ctx:
+rr = fctx.data()
-continue
+for a in added:
-rr = ctx.filectx(r).data()
+bestscore = copies.get(a, (None, threshold))[1]
+aa = repo.wread(a)
 # bdiff.blocks() returns blocks of matching lines
 # count the number of bytes in each
 equal = 0
 alines = mdiff.splitnewlines(aa)
 matches = bdiff.blocks(aa, rr)
 lengths = len(aa) + len(rr)
 if lengths:
 myscore = equal*2.0 / lengths
 if myscore >= bestscore:
-bestname, bestscore = r, myscore
+copies[a] = (r, myscore)
-if bestname:
+for dest, v in copies.iteritems():
-yield bestname, a, bestscore
+source, score = v
+yield source, dest, score
 def addremove(repo, pats=[], opts={}, dry_run=None, similarity=None):
 if dry_run is None:
 dry_run = opts.get('dry_run')
 if similarity is None:

Mercurial > public > mercurial-scm > hg

comparison mercurial/cmdutil.py @ 9925:9dfe34bf42c7