mercurial-scm/hg: contrib/check-code.py comparison

comparison contrib/check-code.py @ 15372:695ac6aca77f stable

check-code: fix issues with finding patterns in unified tests, fix tests

Problems:

- old-style patterns without ^ were getting improperly anchored
- finditer was matching against beginning of line poorly
- \s was matching newlines
- [^x] was matching newlines

so we:

- remove earlier hacks for multiline matching
- fix unified test anchoring by adding .*
- replace \s with [ \t]
- replace [^x] with [^\nx]
- force all matches into multiline mode so ^ anchors work

This uncovers a number of test issues that are then repaired.

author	Matt Mackall <mpm@selenic.com>
date	Thu, 27 Oct 2011 17:22:04 -0500
parents	572c22c88be6
children	3bece03bf3c6

comparison

Legend: equal | deleted | inserted | replaced

-:f26ed4ea46d8
+:695ac6aca77f
 testpats = [
 [
 (r'(pushd|popd)', "don't use 'pushd' or 'popd', use 'cd'"),
 (r'\W\$?\(\([^\)\n]*\)\)', "don't use (()) or $(()), use 'expr'"),
-(r'(^|\n)function', "don't use 'function', use old style"),
+(r'^function', "don't use 'function', use old style"),
 (r'grep.*-q', "don't use 'grep -q', redirect to /dev/null"),
 (r'echo.*\\n', "don't use 'echo \\n', use printf"),
 (r'echo -n', "don't use 'echo -n', use printf"),
-(r'(^|\n)diff.*-\w*N', "don't use 'diff -N'"),
+(r'^diff.*-\w*N', "don't use 'diff -N'"),
-(r'(^| )wc[^|\n]*$', "filter wc output"),
+(r'(^| )wc[^|]*$\n(?!.*\(re\))', "filter wc output"),
 (r'head -c', "don't use 'head -c', use 'dd'"),
 (r'ls.*-\w*R', "don't use 'ls -R', use 'find'"),
 (r'printf.*\\\d\d\d', "don't use 'printf \NNN', use Python"),
 (r'printf.*\\x', "don't use printf \\x, use Python"),
 (r'\$\(.*\)', "don't use $(expr), use `expr`"),
 (r'rm -rf \*', "don't use naked rm -rf, target a directory"),
-(r'(^|\|\s*)grep (-\w\s+)*[^|\n]*[(|]\w',
+(r'(^|\|\s*)grep (-\w\s+)*[^|]*[(|]\w',
 "use egrep for extended grep syntax"),
 (r'/bin/', "don't use explicit paths for tools"),
 (r'\$PWD', "don't use $PWD, use `pwd`"),
 (r'[^\n]\Z', "no trailing newline"),
 (r'export.*=', "don't export and assign at once"),
-('(^|\n)([^"\'\n]|("[^"\n]*")|(\'[^\'\n]*\'))*\\^', "^ must be quoted"),
+(r'^([^"\'\n]|("[^"\n]*")|(\'[^\'\n]*\'))*\\^', "^ must be quoted"),
-(r'(^|\n)source\b', "don't use 'source', use '.'"),
+(r'^source\b', "don't use 'source', use '.'"),
 (r'touch -d', "don't use 'touch -d', use 'touch -t' instead"),
 (r'ls +[^|\n-]+ +-', "options to 'ls' must come before filenames"),
 (r'[^>\n]>\s*\$HGRCPATH', "don't overwrite $HGRCPATH, append to it"),
-(r'stop\(\)', "don't use 'stop' as a shell function name"),
+(r'^stop\(\)', "don't use 'stop' as a shell function name"),
 (r'(\[|\btest\b).*-e ', "don't use 'test -e', use 'test -f'"),
 ],
 # warnings
 []
 ]
 testfilters = [
 (r"( *)(#([^\n]*\S)?)", repcomment),
 (r"<<(\S+)((.|\n)*?\n\1)", rephere),
 ]
-uprefix = r"(^|\n)  \$\s*"
+uprefix = r"^  \$ "
-uprefixc = r"(^|\n)  > "
+uprefixc = r"^  > "
 utestpats = [
 [
-(r'(^|\n)(\S|  $ ).*(\S[ \t]+|^[ \t]+)\n', "trailing whitespace on non-output"),
+(r'^(\S|  $ ).*(\S[ \t]+|^[ \t]+)\n', "trailing whitespace on non-output"),
 (uprefix + r'.*\|\s*sed', "use regex test output patterns instead of sed"),
 (uprefix + r'(true|exit 0)', "explicit zero exit unnecessary"),
 (uprefix + r'.*\$\?', "explicit exit code checks unnecessary"),
 (uprefix + r'.*\|\| echo.*(fail|error)',
 "explicit exit code checks unnecessary"),
 []
 ]
 for i in [0, 1]:
 for p, m in testpats[i]:
-if p.startswith(r'(^|\n)'):
+if p.startswith(r'^'):
-p = uprefix + p[6:]
+p = uprefix + p[1:]
 else:
-p = uprefix + p
+p = uprefix + ".*" + p
 utestpats[i].append((p, m))
 utestfilters = [
 (r"( *)(#([^\n]*\S)?)", repcomment),
 ]
 (r'^\s*\t', "don't use tabs"),
 (r'\S;\s*\n', "semicolon"),
 (r'\w,\w', "missing whitespace after ,"),
 (r'\w[+/*\-<>]\w', "missing whitespace in expression"),
 (r'^\s+\w+=\w+[^,)\n]$', "missing whitespace in assignment"),
-(r'(?m)(\s+)try:\n((?:\n|\1\s.*\n)+?)\1except.*?:\n'
+(r'(\s+)try:\n((?:\n|\1\s.*\n)+?)\1except.*?:\n'
 r'((?:\n|\1\s.*\n)+?)\1finally:', 'no try/except/finally in Py2.4'),
 (r'.{85}', "line too long"),
-(r'(?m) x+[xo][\'"]\n\s+[\'"]x', 'string join across lines with no space'),
+(r' x+[xo][\'"]\n\s+[\'"]x', 'string join across lines with no space'),
 (r'[^\n]\Z', "no trailing newline"),
 (r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),
 #    (r'^\s+[^_ \n][^_. \n]+_[^_\n]+\s*=', "don't use underbars in identifiers"),
 #    (r'\w*[a-z][A-Z]\w*\s*=', "don't use camelcase in identifiers"),
 (r'^\s*(if|while|def|class|except|try)\s[^[\n]*:\s*[^\\n]#\s]+',
 print "Checking %s for %s" % (name, f)
 prelines = None
 errors = []
 for p, msg in pats:
+# fix-up regexes for multiline searches
+po = p
+# \s doesn't match \n
+p = re.sub(r'(?<!\\)\\s', r'[ \\t]', p)
+# [^...] doesn't match newline
+p = re.sub(r'(?<!\\)\[\^', r'[^\\n', p)
+#print po, '=>', p
 pos = 0
 n = 0
-for m in re.finditer(p, post):
+for m in re.finditer(p, post, re.MULTILINE):
 if prelines is None:
 prelines = pre.splitlines()
 postlines = post.splitlines(True)
 start = m.start()

Mercurial > public > mercurial-scm > hg

comparison contrib/check-code.py @ 15372:695ac6aca77f stable