[PATCH 1 of 1] compare grep result between target and its parent
Martin Geisler
mg at lazybytes.net
Sat Jun 20 14:53:07 UTC 2009
# HG changeset patch
# User FUJIWARA Katsunori <foozy at lares.dti.ne.jp>
# Date 1242719394 -32400
# Node ID 929a959f70f71c4fc1e406cc8ad991236dca017d
# Parent 7951f385fcb71f9b684ceb467d37aa43ddecefda
compare grep result between target and its parent
I found that typical case is that grep target is added at (*) revision
in the tree shown below.
+--- 1(*) --- 3
0
+--- 2 ------ 4
Now, I expect 'hg grep --all' to show only rev:1 which is first
appearance of target line.
But 'hg grep --all' will tell:
target line dis-appeared at 3 => 4
target line appeared at 2 => 3
target line dis-appeared at 1 => 2
target line appeared at 0 => 1
because current 'hg grep' implementation compares not between target
revision and its parent, but between neighbor revisions in walkthrough
order.
I checked performance of this patch by "hg grep --follow --all
walkchangerevs" on whole Mercurial repo, and patched version could
complete as fast as un-patched one.
diff --git a/mercurial/commands.py b/mercurial/commands.py
--- a/mercurial/commands.py
+++ b/mercurial/commands.py
@@ -1230,16 +1230,14 @@
for i in xrange(blo, bhi):
yield ('+', b[i])
- prev = {}
- def display(fn, rev, states, prevstates):
+ def display(fn, r, pstates, states):
datefunc = ui.quiet and util.shortdate or util.datestr
found = False
filerevmatches = {}
- r = prev.get(fn, -1)
if opts.get('all'):
- iter = difflinestates(states, prevstates)
+ iter = difflinestates(pstates, states)
else:
- iter = [('', l) for l in prevstates]
+ iter = [('', l) for l in states]
for change, l in iter:
cols = [fn, str(r)]
if opts.get('line_number'):
@@ -1261,8 +1259,8 @@
found = True
return found
- fstate = {}
skip = {}
+ revfiles = {}
get = util.cachefunc(lambda r: repo[r].changeset())
changeiter, matchfn = cmdutil.walkchangerevs(ui, repo, pats, get, opts)
found = False
@@ -1270,46 +1268,58 @@
for st, rev, fns in changeiter:
if st == 'window':
matches.clear()
+ revfiles.clear()
elif st == 'add':
ctx = repo[rev]
- matches[rev] = {}
+ pctx = ctx.parents()[0]
+ parent = pctx.rev()
+ matches.setdefault(rev, {})
+ matches.setdefault(parent, {})
+ files = revfiles.setdefault(rev, [])
for fn in fns:
+ flog = getfile(fn)
+ try:
+ fnode = ctx.filenode(fn)
+ except error.LookupError:
+ continue
+
+ copied = flog.renamed(fnode)
+ copy = follow and copied and copied[0]
+ if copy:
+ copies.setdefault(rev, {})[fn] = copy
if fn in skip:
+ if copy:
+ skip[copy] = True
continue
- try:
- grepbody(fn, rev, getfile(fn).read(ctx.filenode(fn)))
- fstate.setdefault(fn, [])
- if follow:
- copied = getfile(fn).renamed(ctx.filenode(fn))
- if copied:
- copies.setdefault(rev, {})[fn] = copied[0]
- except error.LookupError:
- pass
+ files.append(fn)
+
+ if not matches[rev].has_key(fn):
+ grepbody(fn, rev, flog.read(fnode))
+
+ pfn = copy or fn
+ if not matches[parent].has_key(pfn):
+ try:
+ fnode = pctx.filenode(pfn)
+ grepbody(pfn, parent, flog.read(fnode))
+ except error.LookupError:
+ pass
elif st == 'iter':
- for fn, m in sorted(matches[rev].items()):
+ parent = repo[rev].parents()[0].rev()
+ for fn in sorted(revfiles.get(rev, [])):
+ states = matches[rev][fn]
copy = copies.get(rev, {}).get(fn)
if fn in skip:
if copy:
skip[copy] = True
continue
- if fn in prev or fstate[fn]:
- r = display(fn, rev, m, fstate[fn])
+ pstates = matches.get(parent, {}).get(copy or fn, [])
+ if pstates or states:
+ r = display(fn, rev, pstates, states)
found = found or r
if r and not opts.get('all'):
skip[fn] = True
if copy:
skip[copy] = True
- fstate[fn] = m
- if copy:
- fstate[copy] = m
- prev[fn] = rev
-
- for fn, state in sorted(fstate.items()):
- if fn in skip:
- continue
- if fn not in copies.get(prev[fn], {}):
- found = display(fn, rev, {}, state) or found
- return (not found and 1) or 0
def heads(ui, repo, *branchrevs, **opts):
"""show current repository heads or show branch heads
More information about the Mercurial-devel
mailing list