upstream/mercurial-mirror Commit - r18960:170fc094

1

#!/usr/bin/env python

1

#!/usr/bin/env python

2

#

2

#

3

# check-code - a style and portability checker for Mercurial

3

# check-code - a style and portability checker for Mercurial

4

#

4

#

5

6

#

6

#

7

# This software may be used and distributed according to the terms of the

7

# This software may be used and distributed according to the terms of the

8

# GNU General Public License version 2 or any later version.

8

# GNU General Public License version 2 or any later version.

9

10

import re, glob, os, sys

10

import re, glob, os, sys

11

import keyword

11

import keyword

12

import optparse

12

import optparse

13

14

def repquote(m):
    """replace the content of a quoted string with placeholder characters

    Every word character of the 'text' group becomes "x" and every other
    non-whitespace character becomes "o". Whitespace (newlines included)
    is kept, so the result has the same length and line layout as the
    original text.

    :m: match object providing the named groups 'quote' and 'text'

    return the masked text wrapped in the original quote characters.
    """
    t = re.sub(r"\w", "x", m.group('text'))
    # second pass: whatever is neither whitespace nor an "x" becomes "o"
    t = re.sub(r"[^\s\nx]", "o", t)
    return m.group('quote') + t + m.group('quote')

18

19

def reppython(m):
    """mask a Python comment or string literal matched by a filter regex

    When the 'comment' group matched, the comment (up to its last
    non-whitespace character) is replaced by "#" characters and any
    trailing whitespace is kept as is. Otherwise the match is handed to
    repquote(), which masks the string content.

    :m: match object with a 'comment' group and, for strings, the
        'quote' and 'text' groups expected by repquote()
    """
    comment = m.group('comment')
    if comment:
        # length of the comment without its trailing whitespace
        l = len(comment.rstrip())
        return "#" * l + comment[l:]
    return repquote(m)

25

26

def repcomment(m):
    """mask a '#' comment while keeping what precedes it

    :m: match object; group 1 is kept verbatim and group 2 is replaced
        by as many "#" characters as it is long

    return group 1 followed by the masked comment.
    """
    return m.group(1) + "#" * len(m.group(2))

28

29

def repccomment(m):
    """mask the body of a C block comment

    Inside group 2 every non-whitespace character, and every space that
    directly follows a newline, is replaced by "x". Other whitespace is
    kept.

    :m: match object; group 1 is the text kept in front of the body and
        group 2 is the comment body

    return group 1, the masked body and a closing "*/".
    """
    t = re.sub(r"((?<=\n) )|\S", "x", m.group(2))
    return m.group(1) + t + "*/"

32

33

def repcallspaces(m):
    """drop the whitespace that follows a newline inside group 2

    Each newline in group 2 together with the whitespace run after it is
    collapsed to a single newline.

    :m: match object; group 1 is kept verbatim, group 2 is collapsed

    return group 1 followed by the collapsed group 2.
    """
    t = re.sub(r"\n\s+", "\n", m.group(2))
    return m.group(1) + t

36

37

def repinclude(m):
    """replace the tail of a match with the fixed placeholder "<foo>"

    :m: match object; only group 1 is used

    return group 1 followed by the literal text "<foo>".
    """
    # NOTE(review): the cfilters pattern that uses this function ends
    # group 1 with "<", so the output reads "...<<foo>" - presumably
    # harmless for the checks that run afterwards; confirm before changing.
    return m.group(1) + "<foo>"

39

40

def rephere(m):
    """mask the body matched for a here-document

    Every non-whitespace character of group 2 becomes "x"; whitespace is
    kept, so the line layout is preserved.

    :m: match object; group 1 is kept verbatim and group 2 is masked

    return group 1 followed by the masked group 2.
    """
    t = re.sub(r"\S", "x", m.group(2))
    return m.group(1) + t

43

44

45

testpats = [

45

testpats = [

46

[

46

[

47

(r'pushd|popd', "don't use 'pushd' or 'popd', use 'cd'"),

47

(r'pushd|popd', "don't use 'pushd' or 'popd', use 'cd'"),

48

(r'\W\$?$\([^$\n]*\)\)', "don't use (()) or $(()), use 'expr'"),

48

(r'\W\$?$\([^$\n]*\)\)', "don't use (()) or $(()), use 'expr'"),

49

(r'grep.*-q', "don't use 'grep -q', redirect to /dev/null"),

49

(r'grep.*-q', "don't use 'grep -q', redirect to /dev/null"),

50

(r'sed.*-i', "don't use 'sed -i', use a temporary file"),

50

(r'sed.*-i', "don't use 'sed -i', use a temporary file"),

51

(r'\becho\b.*\\n', "don't use 'echo \\n', use printf"),

51

(r'\becho\b.*\\n', "don't use 'echo \\n', use printf"),

52

(r'echo -n', "don't use 'echo -n', use printf"),

52

(r'echo -n', "don't use 'echo -n', use printf"),

53

(r'(^| )wc[^|]*$\n(?!.*$re$)', "filter wc output"),

53

(r'(^| )wc[^|]*$\n(?!.*$re$)', "filter wc output"),

54

(r'head -c', "don't use 'head -c', use 'dd'"),

54

(r'head -c', "don't use 'head -c', use 'dd'"),

55

(r'sha1sum', "don't use sha1sum, use $TESTDIR/md5sum.py"),

55

(r'sha1sum', "don't use sha1sum, use $TESTDIR/md5sum.py"),

56

(r'ls.*-\w*R', "don't use 'ls -R', use 'find'"),

56

(r'ls.*-\w*R', "don't use 'ls -R', use 'find'"),

57

(r'printf.*\\([1-9]|0\d)', "don't use 'printf \NNN', use Python"),

57

(r'printf.*\\([1-9]|0\d)', "don't use 'printf \NNN', use Python"),

58

(r'printf.*\\x', "don't use printf \\x, use Python"),

58

(r'printf.*\\x', "don't use printf \\x, use Python"),

59

(r'\$$.*$', "don't use $(expr), use `expr`"),

59

(r'\$$.*$', "don't use $(expr), use `expr`"),

60

(r'rm -rf \*', "don't use naked rm -rf, target a directory"),

60

(r'rm -rf \*', "don't use naked rm -rf, target a directory"),

61

(r'(^|\|\s*)grep (-\w\s+)*[^|]*[(|]\w',

61

(r'(^|\|\s*)grep (-\w\s+)*[^|]*[(|]\w',

62

"use egrep for extended grep syntax"),

62

"use egrep for extended grep syntax"),

63

(r'/bin/', "don't use explicit paths for tools"),

63

(r'/bin/', "don't use explicit paths for tools"),

64

(r'[^\n]\Z', "no trailing newline"),

64

(r'[^\n]\Z', "no trailing newline"),

65

(r'export.*=', "don't export and assign at once"),

65

(r'export.*=', "don't export and assign at once"),

66

(r'^source\b', "don't use 'source', use '.'"),

66

(r'^source\b', "don't use 'source', use '.'"),

67

(r'touch -d', "don't use 'touch -d', use 'touch -t' instead"),

67

(r'touch -d', "don't use 'touch -d', use 'touch -t' instead"),

68

(r'ls +[^|\n-]+ +-', "options to 'ls' must come before filenames"),

68

(r'ls +[^|\n-]+ +-', "options to 'ls' must come before filenames"),

69

(r'[^>\n]>\s*\$HGRCPATH', "don't overwrite $HGRCPATH, append to it"),

69

(r'[^>\n]>\s*\$HGRCPATH', "don't overwrite $HGRCPATH, append to it"),

70

(r'^stop', "don't use 'stop' as a shell function name"),

70

(r'^stop', "don't use 'stop' as a shell function name"),

71

(r'(\[|\btest\b).*-e ', "don't use 'test -e', use 'test -f'"),

71

(r'(\[|\btest\b).*-e ', "don't use 'test -e', use 'test -f'"),

72

(r'^alias\b.*=', "don't use alias, use a function"),

72

(r'^alias\b.*=', "don't use alias, use a function"),

73

(r'if\s*!', "don't use '!' to negate exit status"),

73

(r'if\s*!', "don't use '!' to negate exit status"),

74

(r'/dev/u?random', "don't use entropy, use /dev/zero"),

74

(r'/dev/u?random', "don't use entropy, use /dev/zero"),

75

(r'do\s*true;\s*done', "don't use true as loop body, use sleep 0"),

75

(r'do\s*true;\s*done', "don't use true as loop body, use sleep 0"),

76

(r'^( *)\t', "don't use tabs to indent"),

76

(r'^( *)\t', "don't use tabs to indent"),

77

],

77

],

78

# warnings

78

# warnings

79

[

79

[

80

(r'^function', "don't use 'function', use old style"),

80

(r'^function', "don't use 'function', use old style"),

81

(r'^diff.*-\w*N', "don't use 'diff -N'"),

81

(r'^diff.*-\w*N', "don't use 'diff -N'"),

82

(r'\$PWD|\${PWD}', "don't use $PWD, use `pwd`"),

82

(r'\$PWD|\${PWD}', "don't use $PWD, use `pwd`"),

83

(r'^([^"\'\n]|("[^"\n]*")|(\'[^\'\n]*\'))*\^', "^ must be quoted"),

83

(r'^([^"\'\n]|("[^"\n]*")|(\'[^\'\n]*\'))*\^', "^ must be quoted"),

84

(r'kill (`|\$\()', "don't use kill, use killdaemons.py")

84

(r'kill (`|\$\()', "don't use kill, use killdaemons.py")

85

]

85

]

86

]

86

]

87

88

# (pattern, replacement function) pairs; checkfile() applies each pair
# with re.sub() to the file content before the test-script patterns run
testfilters = [
    (r"( *)(#([^\n]*\S)?)", repcomment),
    (r"<<(\S+)((.|\n)*?\n\1)", rephere),
]

92

93

# message shared by the unified-test patterns about $TESTTMP paths
winglobmsg = "use (glob) to match Windows paths too"
# regex prefix put in front of the unified-test command patterns
uprefix = r"^ \$ "

95

utestpats = [

95

utestpats = [

96

[

96

[

97

(r'^(\S.*|| [$>] .*)[ \t]\n', "trailing whitespace on non-output"),

97

(r'^(\S.*|| [$>] .*)[ \t]\n', "trailing whitespace on non-output"),

98

(uprefix + r'.*\|\s*sed[^|>\n]*\n',

98

(uprefix + r'.*\|\s*sed[^|>\n]*\n',

99

"use regex test output patterns instead of sed"),

99

"use regex test output patterns instead of sed"),

100

(uprefix + r'(true|exit 0)', "explicit zero exit unnecessary"),

100

(uprefix + r'(true|exit 0)', "explicit zero exit unnecessary"),

101

(uprefix + r'.*(?<!\[)\$\?', "explicit exit code checks unnecessary"),

101

(uprefix + r'.*(?<!\[)\$\?', "explicit exit code checks unnecessary"),

102

(uprefix + r'.*\|\| echo.*(fail|error)',

102

(uprefix + r'.*\|\| echo.*(fail|error)',

103

"explicit exit code checks unnecessary"),

103

"explicit exit code checks unnecessary"),

104

(uprefix + r'set -e', "don't use set -e"),

104

(uprefix + r'set -e', "don't use set -e"),

105

(uprefix + r'\s', "don't indent commands, use > for continued lines"),

105

(uprefix + r'\s', "don't indent commands, use > for continued lines"),

106

(r'^ saved backup bundle to \$TESTTMP.*\.hg$', winglobmsg),

106

(r'^ saved backup bundle to \$TESTTMP.*\.hg$', winglobmsg),

107

(r'^ changeset .* references (corrupted|missing) \$TESTTMP/.*[^)]$',

107

(r'^ changeset .* references (corrupted|missing) \$TESTTMP/.*[^)]$',

108

winglobmsg),

108

winglobmsg),

109

(r'^ pulling from \$TESTTMP/.*[^)]$', winglobmsg, '\$TESTTMP/unix-repo$'),

109

(r'^ pulling from \$TESTTMP/.*[^)]$', winglobmsg, '\$TESTTMP/unix-repo$'),

110

],

110

],

111

# warnings

111

# warnings

112

[

112

[

113

(r'^ [^*?/\n]* $glob$$',

113

(r'^ [^*?/\n]* $glob$$',

114

"warning: glob match with no glob character (?*/)"),

114

"warning: glob match with no glob character (?*/)"),

115

]

115

]

116

]

116

]

117

118

# Reuse every shell test pattern for unified tests: index 0 holds the
# error patterns and index 1 the warning patterns. Each pattern is
# re-anchored behind the "^ [$>] " line prefix; a pattern that was itself
# anchored with "^" must match right after the prefix, any other pattern
# may match anywhere later on the line.
for i in [0, 1]:
    for p, m in testpats[i]:
        if p.startswith(r'^'):
            p = r"^ [$>] (%s)" % p[1:]
        else:
            p = r"^ [$>] .*(%s)" % p
        utestpats[i].append((p, m))

125

126

# (pattern, replacement function) pairs; checkfile() applies each pair
# with re.sub() to the file content before the unified-test patterns run
utestfilters = [
    (r"<<(\S+)((.|\n)*?\n > \1)", rephere),
    (r"( *)(#([^\n]*\S)?)", repcomment),
]

130

131

pypats = [

131

pypats = [

132

[

132

[

133

(r'^\s*def\s*\w+\s*\(.*,\s*\(',

133

(r'^\s*def\s*\w+\s*\(.*,\s*\(',

134

"tuple parameter unpacking not available in Python 3+"),

134

"tuple parameter unpacking not available in Python 3+"),

135

(r'lambda\s*$.*,.*$',

135

(r'lambda\s*$.*,.*$',

136

"tuple parameter unpacking not available in Python 3+"),

136

"tuple parameter unpacking not available in Python 3+"),

137

(r'(?<!def)\s+(cmp)\(', "cmp is not available in Python 3+"),

137

(r'(?<!def)\s+(cmp)\(', "cmp is not available in Python 3+"),

138

(r'\breduce\s*\(.*', "reduce is not available in Python 3+"),

138

(r'\breduce\s*\(.*', "reduce is not available in Python 3+"),

139

(r'\.has_key\b', "dict.has_key is not available in Python 3+"),

139

(r'\.has_key\b', "dict.has_key is not available in Python 3+"),

140

(r'\s<>\s', '<> operator is not available in Python 3+, use !='),

140

(r'\s<>\s', '<> operator is not available in Python 3+, use !='),

141

(r'^\s*\t', "don't use tabs"),

141

(r'^\s*\t', "don't use tabs"),

142

(r'\S;\s*\n', "semicolon"),

142

(r'\S;\s*\n', "semicolon"),

143

(r'[^_]_\("[^"]+"\s*%', "don't use % inside _()"),

143

(r'[^_]_\("[^"]+"\s*%', "don't use % inside _()"),

144

(r"[^_]_\('[^']+'\s*%", "don't use % inside _()"),

144

(r"[^_]_\('[^']+'\s*%", "don't use % inside _()"),

145

(r'(\w|\)),\w', "missing whitespace after ,"),

145

(r'(\w|\)),\w', "missing whitespace after ,"),

146

(r'(\w|\))[+/*\-<>]\w', "missing whitespace in expression"),

146

(r'(\w|\))[+/*\-<>]\w', "missing whitespace in expression"),

147

(r'^\s+(\w|\.)+=\w[^,()\n]*$', "missing whitespace in assignment"),

147

(r'^\s+(\w|\.)+=\w[^,()\n]*$', "missing whitespace in assignment"),

148

(r'(\s+)try:\n((?:\n|\1\s.*\n)+?)\1except.*?:\n'

148

(r'(\s+)try:\n((?:\n|\1\s.*\n)+?)\1except.*?:\n'

149

r'((?:\n|\1\s.*\n)+?)\1finally:', 'no try/except/finally in Python 2.4'),

149

r'((?:\n|\1\s.*\n)+?)\1finally:', 'no try/except/finally in Python 2.4'),

150

(r'(\s+)try:\n((?:\n|\1\s.*\n)*?)\1\s*yield\b.*?'

150

(r'(\s+)try:\n((?:\n|\1\s.*\n)*?)\1\s*yield\b.*?'

151

r'((?:\n|\1\s.*\n)+?)\1finally:',

151

r'((?:\n|\1\s.*\n)+?)\1finally:',

152

'no yield inside try/finally in Python 2.4'),

152

'no yield inside try/finally in Python 2.4'),

153

(r'.{81}', "line too long"),

153

(r'.{81}', "line too long"),

154

(r' x+[xo][\'"]\n\s+[\'"]x', 'string join across lines with no space'),

154

(r' x+[xo][\'"]\n\s+[\'"]x', 'string join across lines with no space'),

155

(r'[^\n]\Z', "no trailing newline"),

155

(r'[^\n]\Z', "no trailing newline"),

156

(r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),

156

(r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),

157

# (r'^\s+[^_ \n][^_. \n]+_[^_\n]+\s*=',

157

# (r'^\s+[^_ \n][^_. \n]+_[^_\n]+\s*=',

158

# "don't use underbars in identifiers"),

158

# "don't use underbars in identifiers"),

159

(r'^\s+(self\.)?[A-za-z][a-z0-9]+[A-Z]\w* = ',

159

(r'^\s+(self\.)?[A-za-z][a-z0-9]+[A-Z]\w* = ',

160

"don't use camelcase in identifiers"),

160

"don't use camelcase in identifiers"),

161

161

162

"linebreak after :"),

162

"linebreak after :"),

163

(r'class\s[^( \n]+:', "old-style class, use class foo(object)"),

163

(r'class\s[^( \n]+:', "old-style class, use class foo(object)"),

164

(r'class\s[^( \n]+:',

164

(r'class\s[^( \n]+:',

165

"class foo() not available in Python 2.4, use class foo(object)"),

165

"class foo() not available in Python 2.4, use class foo(object)"),

166

(r'\b(%s)\(' % '|'.join(keyword.kwlist),

166

(r'\b(%s)\(' % '|'.join(keyword.kwlist),

167

"Python keyword is not a function"),

167

"Python keyword is not a function"),

168

(r',]', "unneeded trailing ',' in list"),

168

(r',]', "unneeded trailing ',' in list"),

169

# (r'class\s[A-Z][^\(]*\((?!Exception)',

169

# (r'class\s[A-Z][^\(]*\((?!Exception)',

170

# "don't capitalize non-exception classes"),

170

# "don't capitalize non-exception classes"),

171

# (r'in range\(', "use xrange"),

171

# (r'in range\(', "use xrange"),

172

# (r'^\s*print\s+', "avoid using print in core and extensions"),

172

# (r'^\s*print\s+', "avoid using print in core and extensions"),

173

(r'[\x80-\xff]', "non-ASCII character literal"),

173

(r'[\x80-\xff]', "non-ASCII character literal"),

174

(r'("\')\.format\(', "str.format() not available in Python 2.4"),

174

(r'("\')\.format\(', "str.format() not available in Python 2.4"),

175

(r'^\s*with\s+', "with not available in Python 2.4"),

175

(r'^\s*with\s+', "with not available in Python 2.4"),

176

(r'\.isdisjoint\(', "set.isdisjoint not available in Python 2.4"),

176

(r'\.isdisjoint\(', "set.isdisjoint not available in Python 2.4"),

177

(r'^\s*except.* as .*:', "except as not available in Python 2.4"),

177

(r'^\s*except.* as .*:', "except as not available in Python 2.4"),

178

(r'^\s*os\.path\.relpath', "relpath not available in Python 2.4"),

178

(r'^\s*os\.path\.relpath', "relpath not available in Python 2.4"),

179

(r'(?<!def)\s+(any|all|format)\(',

179

(r'(?<!def)\s+(any|all|format)\(',

180

"any/all/format not available in Python 2.4"),

180

"any/all/format not available in Python 2.4"),

181

(r'(?<!def)\s+(callable)\(',

181

(r'(?<!def)\s+(callable)\(',

182

"callable not available in Python 3, use getattr(f, '__call__', None)"),

182

"callable not available in Python 3, use getattr(f, '__call__', None)"),

183

(r'if\s.*\selse', "if ... else form not available in Python 2.4"),

183

(r'if\s.*\selse', "if ... else form not available in Python 2.4"),

184

(r'^\s*(%s)\s\s' % '|'.join(keyword.kwlist),

184

(r'^\s*(%s)\s\s' % '|'.join(keyword.kwlist),

185

"gratuitous whitespace after Python keyword"),

185

"gratuitous whitespace after Python keyword"),

186

(r'([$\[][ \t]\S)|(\S[ \t][$\]])', "gratuitous whitespace in () or []"),

186

(r'([$\[][ \t]\S)|(\S[ \t][$\]])', "gratuitous whitespace in () or []"),

187

# (r'\s\s=', "gratuitous whitespace before ="),

187

# (r'\s\s=', "gratuitous whitespace before ="),

188

(r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',

188

(r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',

189

"missing whitespace around operator"),

189

"missing whitespace around operator"),

190

(r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\s',

190

(r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\s',

191

"missing whitespace around operator"),

191

"missing whitespace around operator"),

192

(r'\s(\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',

192

(r'\s(\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',

193

"missing whitespace around operator"),

193

"missing whitespace around operator"),

194

(r'[^^+=*/!<>&| %-](\s=|=\s)[^= ]',

194

(r'[^^+=*/!<>&| %-](\s=|=\s)[^= ]',

195

"wrong whitespace around ="),

195

"wrong whitespace around ="),

196

(r'raise Exception', "don't raise generic exceptions"),

196

(r'raise Exception', "don't raise generic exceptions"),

197

(r'raise [^,(]+, ($[^$]+\)|[^,]+)$',

197

(r'raise [^,(]+, ($[^$]+\)|[^,]+)$',

198

"don't use old-style two-argument raise, use Exception(message)"),

198

"don't use old-style two-argument raise, use Exception(message)"),

199

(r' is\s+(not\s+)?["\'0-9-]', "object comparison with literal"),

199

(r' is\s+(not\s+)?["\'0-9-]', "object comparison with literal"),

200

(r' [=!]=\s+(True|False|None)',

200

(r' [=!]=\s+(True|False|None)',

201

"comparison with singleton, use 'is' or 'is not' instead"),

201

"comparison with singleton, use 'is' or 'is not' instead"),

202

(r'^\s*(while|if) [01]:',

202

(r'^\s*(while|if) [01]:',

203

"use True/False for constant Boolean expression"),

203

"use True/False for constant Boolean expression"),

204

(r'(?:(?<!def)\s+|\()hasattr',

204

(r'(?:(?<!def)\s+|\()hasattr',

205

'hasattr(foo, bar) is broken, use util.safehasattr(foo, bar) instead'),

205

'hasattr(foo, bar) is broken, use util.safehasattr(foo, bar) instead'),

206

(r'opener$[^)]*$.read\(',

206

(r'opener$[^)]*$.read\(',

207

"use opener.read() instead"),

207

"use opener.read() instead"),

208

(r'BaseException', 'not in Python 2.4, use Exception'),

208

(r'BaseException', 'not in Python 2.4, use Exception'),

209

(r'os\.path\.relpath', 'os.path.relpath is not in Python 2.5'),

209

(r'os\.path\.relpath', 'os.path.relpath is not in Python 2.5'),

210

(r'opener$[^)]*$.write\(',

210

(r'opener$[^)]*$.write\(',

211

"use opener.write() instead"),

211

"use opener.write() instead"),

212

(r'[\s$](open|file)\([^)]*$\.read\(',

212

(r'[\s$](open|file)\([^)]*$\.read\(',

213

"use util.readfile() instead"),

213

"use util.readfile() instead"),

214

(r'[\s$](open|file)\([^)]*$\.write\(',

214

(r'[\s$](open|file)\([^)]*$\.write\(',

215

"use util.readfile() instead"),

215

"use util.readfile() instead"),

216

(r'^[\s$]*(open(er)?|file)\([^)]*$',

216

(r'^[\s$]*(open(er)?|file)\([^)]*$',

217

"always assign an opened file to a variable, and close it afterwards"),

217

"always assign an opened file to a variable, and close it afterwards"),

218

(r'[\s$](open|file)\([^)]*$\.',

218

(r'[\s$](open|file)\([^)]*$\.',

219

"always assign an opened file to a variable, and close it afterwards"),

219

"always assign an opened file to a variable, and close it afterwards"),

220

(r'(?i)descendent', "the proper spelling is descendAnt"),

220

(r'(?i)descendent', "the proper spelling is descendAnt"),

221

(r'\.debug\(\_', "don't mark debug messages for translation"),

221

(r'\.debug\(\_', "don't mark debug messages for translation"),

222

(r'\.strip\.split', "no need to strip before splitting"),

222

(r'\.strip\.split', "no need to strip before splitting"),

223

(r'^\s*except\s*:', "naked except clause", r'#.*re-raises'),

223

(r'^\s*except\s*:', "naked except clause", r'#.*re-raises'),

224

(r':\n( )*( ){1,3}[^ ]', "must indent 4 spaces"),

224

(r':\n( )*( ){1,3}[^ ]', "must indent 4 spaces"),

225

(r'ui\.(status|progress|write|note|warn)\([\'\"]x',

225

(r'ui\.(status|progress|write|note|warn)\([\'\"]x',

226

"missing _() in ui message (use () to hide false-positives)"),

226

"missing _() in ui message (use () to hide false-positives)"),

227

],

227

],

228

# warnings

228

# warnings

229

[

229

[

230

]

230

]

231

]

231

]

232

233

# Single filter masking Python comments and string literals through
# reppython(). The regex is compiled in verbose mode ((?x)), so the line
# breaks and indentation inside the literal are not part of the pattern.
pyfilters = [
    (r"""(?msx)(?P<comment>\#.*?$)|
         ((?P<quote>('''|\"\"\"|(?<!')'(?!')|(?<!")"(?!")))
          (?P<text>(([^\\]|\\.)*?))
          (?P=quote))""", reppython),
]

239

240

# plain text files are checked unfiltered
txtfilters = []

# [error patterns, warning patterns] as (regex, message) tuples
txtpats = [
    [
        # raw string: same value as before, without relying on Python
        # passing the unknown escape "\s" through unchanged
        (r'\s$', 'trailing whitespace'),
    ],
    []
]

248

240

cpats = [

249

cpats = [

241

[

250

[

242

(r'//', "don't use //-style comments"),

251

(r'//', "don't use //-style comments"),

243

(r'^ ', "don't use spaces to indent"),

252

(r'^ ', "don't use spaces to indent"),

244

(r'\S\t', "don't use tabs except for indent"),

253

(r'\S\t', "don't use tabs except for indent"),

245

(r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),

254

(r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),

246

(r'.{81}', "line too long"),

255

(r'.{81}', "line too long"),

247

(r'(while|if|do|for)\(', "use space after while/if/do/for"),

256

(r'(while|if|do|for)\(', "use space after while/if/do/for"),

248

(r'return\(', "return is not a function"),

257

(r'return\(', "return is not a function"),

249

(r' ;', "no space before ;"),

258

(r' ;', "no space before ;"),

250

(r'\w+\* \w+', "use int *foo, not int* foo"),

259

(r'\w+\* \w+', "use int *foo, not int* foo"),

251

(r'$[^$]+\) \w+', "use (int)foo, not (int) foo"),

260

(r'$[^$]+\) \w+', "use (int)foo, not (int) foo"),

252

(r'\w+ (\+\+|--)', "use foo++, not foo ++"),

261

(r'\w+ (\+\+|--)', "use foo++, not foo ++"),

253

(r'\w,\w', "missing whitespace after ,"),

262

(r'\w,\w', "missing whitespace after ,"),

254

(r'^[^#]\w[+/*]\w', "missing whitespace in expression"),

263

(r'^[^#]\w[+/*]\w', "missing whitespace in expression"),

255

(r'^#\s+\w', "use #foo, not # foo"),

264

(r'^#\s+\w', "use #foo, not # foo"),

256

(r'[^\n]\Z', "no trailing newline"),

265

(r'[^\n]\Z', "no trailing newline"),

257

(r'^\s*#import\b', "use only #include in standard C code"),

266

(r'^\s*#import\b', "use only #include in standard C code"),

258

],

267

],

259

# warnings

268

# warnings

260

[]

269

[]

261

]

270

]

262

271

263

cfilters = [

272

cfilters = [

264

(r'(/\*)(((\*(?!/))|[^*])*)\*/', repccomment),

273

(r'(/\*)(((\*(?!/))|[^*])*)\*/', repccomment),

265

(r'''(?P<quote>(?<!")")(?P<text>([^"]|\\")+)"(?!")''', repquote),

274

(r'''(?P<quote>(?<!")")(?P<text>([^"]|\\")+)"(?!")''', repquote),

266

(r'''(#\s*include\s+<)([^>]+)>''', repinclude),

275

(r'''(#\s*include\s+<)([^>]+)>''', repinclude),

267

(r'($)([^)]+$)', repcallspaces),

276

(r'($)([^)]+$)', repcallspaces),

268

]

277

]

269

278

270

# [error patterns, warning patterns] as (regex, message) tuples; paired
# with mercurial/util.py in the checks table
inutilpats = [
    [
        (r'\bui\.', "don't use ui in util"),
    ],
    # warnings
    []
]

277

286

278

# [error patterns, warning patterns] as (regex, message) tuples; paired
# with mercurial/revlog.py in the checks table
inrevlogpats = [
    [
        (r'\brepo\.', "don't use repo in revlog"),
    ],
    # warnings
    []
]

285

294

286

# One entry per kind of check: (name, filename regex, filters, patterns).
# checkfile() tests the filename regex with re.match() against the file
# path, runs the filters over the content and then looks for the patterns.
checks = [
    ('python', r'.*\.(py|cgi)$', pyfilters, pypats),
    ('test script', r'(.*/)?test-[^.~]*$', testfilters, testpats),
    ('c', r'.*\.c$', cfilters, cpats),
    ('unified test', r'.*\.t$', utestfilters, utestpats),
    ('layering violation repo in revlog', r'mercurial/revlog\.py', pyfilters,
     inrevlogpats),
    ('layering violation ui in util', r'mercurial/util\.py', pyfilters,
     inutilpats),
    ('txt', r'.*\.txt$', txtfilters, txtpats),
]

296

306

297

class norepeatlogger(object):

307

class norepeatlogger(object):

298

def __init__(self):

308

def __init__(self):

299

self._lastseen = None

309

self._lastseen = None

300

310

301

def log(self, fname, lineno, line, msg, blame):

311

def log(self, fname, lineno, line, msg, blame):

302

"""print error related a to given line of a given file.

312

"""print error related a to given line of a given file.

303

313

304

The faulty line will also be printed but only once in the case

314

The faulty line will also be printed but only once in the case

305

of multiple errors.

315

of multiple errors.

306

316

307

:fname: filename

317

:fname: filename

308

:lineno: line number

318

:lineno: line number

309

:line: actual content of the line

319

:line: actual content of the line

310

:msg: error message

320

:msg: error message

311

"""

321

"""

312

msgid = fname, lineno, line

322

msgid = fname, lineno, line

313

if msgid != self._lastseen:

323

if msgid != self._lastseen:

314

if blame:

324

if blame:

315

print "%s:%d (%s):" % (fname, lineno, blame)

325

print "%s:%d (%s):" % (fname, lineno, blame)

316

else:

326

else:

317

print "%s:%d:" % (fname, lineno)

327

print "%s:%d:" % (fname, lineno)

318

print " > %s" % line

328

print " > %s" % line

319

self._lastseen = msgid

329

self._lastseen = msgid

320

print " " + msg

330

print " " + msg

321

331

322

_defaultlogger = norepeatlogger()

332

_defaultlogger = norepeatlogger()

323

333

324

def getblame(f):
    """collect per-line blame information for a file

    Runs "hg annotate -un" on the file and parses each output line, which
    is expected to look like "<user> <rev>: <content>".

    :f: filepath

    return a list of (content, user, rev) tuples, one per output line,
    or an empty list when the hg command cannot be started.
    """
    # local import: only this function needs the module
    import subprocess
    try:
        # an argument list (no shell) keeps paths containing spaces or
        # shell metacharacters intact
        proc = subprocess.Popen(['hg', 'annotate', '-un', f],
                                stdout=subprocess.PIPE,
                                universal_newlines=True)
    except OSError:
        # without blame data the caller still reports the error itself
        return []
    lines = []
    try:
        for l in proc.stdout:
            start, line = l.split(':', 1)
            user, rev = start.split()
            # strip the line terminator only when there is one, so a
            # final line without newline keeps its last character
            if line.endswith('\n'):
                line = line[:-1]
            # drop the single space separating "rev:" from the content
            lines.append((line[1:], user, rev))
    finally:
        proc.stdout.close()
        proc.wait()
    return lines

331

341

332

def checkfile(f, logfunc=_defaultlogger.log, maxerr=None, warnings=False,

342

def checkfile(f, logfunc=_defaultlogger.log, maxerr=None, warnings=False,

333

blame=False, debug=False, lineno=True):

343

blame=False, debug=False, lineno=True):

334

"""checks style and portability of a given file

344

"""checks style and portability of a given file

335

345

336

:f: filepath

346

:f: filepath

337

:logfunc: function used to report error

347

:logfunc: function used to report error

338

logfunc(filename, linenumber, linecontent, errormessage)

348

logfunc(filename, linenumber, linecontent, errormessage)

339

:maxerr: number of error to display before aborting.

349

:maxerr: number of error to display before aborting.

340

Set to false (default) to report all errors

350

Set to false (default) to report all errors

341

351

342

return True if no error is found, False otherwise.

352

return True if no error is found, False otherwise.

343

"""

353

"""

344

blamecache = None

354

blamecache = None

345

result = True

355

result = True

346

for name, match, filters, pats in checks:

356

for name, match, filters, pats in checks:

347

if debug:

357

if debug:

348

print name, f

358

print name, f

349

fc = 0

359

fc = 0

350

if not re.match(match, f):

360

if not re.match(match, f):

351

if debug:

361

if debug:

352

print "Skipping %s for %s it doesn't match %s" % (

362

print "Skipping %s for %s it doesn't match %s" % (

353

name, match, f)

363

name, match, f)

354

continue

364

continue

355

fp = open(f)

365

fp = open(f)

356

pre = post = fp.read()

366

pre = post = fp.read()

357

fp.close()

367

fp.close()

358

if "no-" + "check-code" in pre:

368

if "no-" + "check-code" in pre:

359

if debug:

369

if debug:

360

print "Skipping %s for %s it has no- and check-code" % (

370

print "Skipping %s for %s it has no- and check-code" % (

361

name, f)

371

name, f)

362

break

372

break

363

for p, r in filters:

373

for p, r in filters:

364

post = re.sub(p, r, post)

374

post = re.sub(p, r, post)

365

if warnings:

375

if warnings:

366

pats = pats[0] + pats[1]

376

pats = pats[0] + pats[1]

367

else:

377

else:

368

pats = pats[0]

378

pats = pats[0]

369

# print post # uncomment to show filtered version

379

# print post # uncomment to show filtered version

370

380

371

if debug:

381

if debug:

372

print "Checking %s for %s" % (name, f)

382

print "Checking %s for %s" % (name, f)

373

383

374

prelines = None

384

prelines = None

375

errors = []

385

errors = []

376

for pat in pats:

386

for pat in pats:

377

if len(pat) == 3:

387

if len(pat) == 3:

378

p, msg, ignore = pat

388

p, msg, ignore = pat

379

else:

389

else:

380

p, msg = pat

390

p, msg = pat

381

ignore = None

391

ignore = None

382

392

383

# fix-up regexes for multi-line searches

393

# fix-up regexes for multi-line searches

384

po = p

394

po = p

385

# \s doesn't match \n

395

# \s doesn't match \n

386

p = re.sub(r'(?<!\\)\\s', r'[ \\t]', p)

396

p = re.sub(r'(?<!\\)\\s', r'[ \\t]', p)

387

# [^...] doesn't match newline

397

# [^...] doesn't match newline

388

p = re.sub(r'(?<!\\)\[\^', r'[^\\n', p)

398

p = re.sub(r'(?<!\\)\[\^', r'[^\\n', p)

389

399

390

#print po, '=>', p

400

#print po, '=>', p

391

401

392

pos = 0

402

pos = 0

393

n = 0

403

n = 0

394

for m in re.finditer(p, post, re.MULTILINE):

404

for m in re.finditer(p, post, re.MULTILINE):

395

if prelines is None:

405

if prelines is None:

396

prelines = pre.splitlines()

406

prelines = pre.splitlines()

397

postlines = post.splitlines(True)

407

postlines = post.splitlines(True)

398

408

399

start = m.start()

409

start = m.start()

400

while n < len(postlines):

410

while n < len(postlines):

401

step = len(postlines[n])

411

step = len(postlines[n])

402

if pos + step > start:

412

if pos + step > start:

403

break

413

break

404

pos += step

414

pos += step

405

n += 1

415

n += 1

406

l = prelines[n]

416

l = prelines[n]

407

417

408

if "check-code" + "-ignore" in l:

418

if "check-code" + "-ignore" in l:

409

if debug:

419

if debug:

410

print "Skipping %s for %s:%s (check-code -ignore)" % (

420

print "Skipping %s for %s:%s (check-code -ignore)" % (

411

name, f, n)

421

name, f, n)

412

continue

422

continue

413

elif ignore and re.search(ignore, l, re.MULTILINE):

423

elif ignore and re.search(ignore, l, re.MULTILINE):

414

continue

424

continue

415

bd = ""

425

bd = ""

416

if blame:

426

if blame:

417

bd = 'working directory'

427

bd = 'working directory'

418

if not blamecache:

428

if not blamecache:

419

blamecache = getblame(f)

429

blamecache = getblame(f)

420

if n < len(blamecache):

430

if n < len(blamecache):

421

bl, bu, br = blamecache[n]

431

bl, bu, br = blamecache[n]

422

if bl == l:

432

if bl == l:

423

bd = '%s@%s' % (bu, br)

433

bd = '%s@%s' % (bu, br)

424

errors.append((f, lineno and n + 1, l, msg, bd))

434

errors.append((f, lineno and n + 1, l, msg, bd))

425

result = False

435

result = False

426

436

427

errors.sort()

437

errors.sort()

428

for e in errors:

438

for e in errors:

429

logfunc(*e)

439

logfunc(*e)

430

fc += 1

440

fc += 1

431

if maxerr and fc >= maxerr:

441

if maxerr and fc >= maxerr:

432

print " (too many errors, giving up)"

442

print " (too many errors, giving up)"

433

break

443

break

434

444

435

return result

445

return result

436

446

437

if __name__ == "__main__":

447

if __name__ == "__main__":

438

parser = optparse.OptionParser("%prog [options] [files]")

448

parser = optparse.OptionParser("%prog [options] [files]")

439

parser.add_option("-w", "--warnings", action="store_true",

449

parser.add_option("-w", "--warnings", action="store_true",

440

help="include warning-level checks")

450

help="include warning-level checks")

441

parser.add_option("-p", "--per-file", type="int",

451

parser.add_option("-p", "--per-file", type="int",

442

help="max warnings per file")

452

help="max warnings per file")

443

parser.add_option("-b", "--blame", action="store_true",

453

parser.add_option("-b", "--blame", action="store_true",

444

help="use annotate to generate blame info")

454

help="use annotate to generate blame info")

445

parser.add_option("", "--debug", action="store_true",

455

parser.add_option("", "--debug", action="store_true",

446

help="show debug information")

456

help="show debug information")

447

parser.add_option("", "--nolineno", action="store_false",

457

parser.add_option("", "--nolineno", action="store_false",

448

dest='lineno', help="don't show line numbers")

458

dest='lineno', help="don't show line numbers")

449

459

450

parser.set_defaults(per_file=15, warnings=False, blame=False, debug=False,

460

parser.set_defaults(per_file=15, warnings=False, blame=False, debug=False,

451

lineno=True)

461

lineno=True)

452

(options, args) = parser.parse_args()

462

(options, args) = parser.parse_args()

453

463

454

if len(args) == 0:

464

if len(args) == 0:

455

check = glob.glob("*")

465

check = glob.glob("*")

456

else:

466

else:

457

check = args

467

check = args

458

468

459

ret = 0

469

ret = 0

460

for f in check:

470

for f in check:

461

if not checkfile(f, maxerr=options.per_file, warnings=options.warnings,

471

if not checkfile(f, maxerr=options.per_file, warnings=options.warnings,

462

blame=options.blame, debug=options.debug,

472

blame=options.blame, debug=options.debug,

463

lineno=options.lineno):

473

lineno=options.lineno):

464

ret = 1

474

ret = 1

465

sys.exit(ret)

475

sys.exit(ret)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             #!/usr/bin/env python
             #
             # check-code - a style and portability checker for Mercurial
             #
             # Copyright 2010 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             import re, glob, os, sys
             import keyword
             import optparse
             def repquote(m):
                 """Mask the content of a quoted string matched by m.

                 Every word character of the 'text' group becomes "x" and every
                 remaining character that is neither whitespace nor "x" becomes "o".
                 The masked text is returned wrapped in the 'quote' group on both
                 sides, so the length and line structure of the string are kept.
                 """
                 masked = re.sub(r"[^\s\nx]", "o",
                                 re.sub(r"\w", "x", m.group('text')))
                 delimiter = m.group('quote')
                 return delimiter + masked + delimiter
             def reppython(m):
                 """Mask a Python comment or quoted string matched by m.

                 When the 'comment' group matched, its text up to the last
                 non-whitespace character is replaced by "#" characters and the
                 trailing whitespace is kept as is. Otherwise the match is handed
                 to repquote().
                 """
                 comment = m.group('comment')
                 if not comment:
                     return repquote(m)
                 visible = len(comment.rstrip())
                 return "#" * visible + comment[visible:]
             def repcomment(m):
                 """Return group 1 followed by one "#" per character of group 2."""
                 prefix = m.group(1)
                 body = m.group(2)
                 return prefix + len(body) * "#"
             def repccomment(m):
                 """Mask the body of a C comment matched by m.

                 In group 2 every non-whitespace character, and a single space that
                 directly follows a newline, is replaced by "x". The result is
                 group 1, the masked body and a closing "*/".
                 """
                 body = m.group(2)
                 masked = re.sub(r"((?<=\n) )|\S", "x", body)
                 return m.group(1) + masked + "*/"
             def repcallspaces(m):
                 """Drop the whitespace that follows newlines inside group 2.

                 Each newline together with the whitespace run after it is collapsed
                 to a single newline; group 1 is prepended unchanged.
                 """
                 tail = m.group(2)
                 tail = re.sub(r"\n\s+", "\n", tail)
                 return m.group(1) + tail
             def repinclude(m):
                 """Return group 1 of m with the literal text "<foo>" appended."""
                 head = m.group(1)
                 return head + "<foo>"
             def rephere(m):
                 """Mask group 2 of m, keeping its whitespace.

                 Every non-whitespace character of group 2 becomes "x"; group 1 is
                 prepended unchanged.
                 """
                 masked = re.sub(r"\S", "x", m.group(2))
                 lead = m.group(1)
                 return lead + masked
             # Patterns for the 'test script' check (see the checks table).
             # Layout shared by all *pats tables: a two-element list whose first
             # element holds the patterns checkfile() always applies and whose
             # second element holds the ones applied only when warnings are
             # requested. Each entry is (regex, message) or
             # (regex, message, ignore-regex).
             testpats = [
               [
                 (r'pushd|popd', "don't use 'pushd' or 'popd', use 'cd'"),
                 (r'\W\$?\(\([^\)\n]*\)\)', "don't use (()) or $(()), use 'expr'"),
                 (r'grep.*-q', "don't use 'grep -q', redirect to /dev/null"),
                 (r'sed.*-i', "don't use 'sed -i', use a temporary file"),
                 (r'\becho\b.*\\n', "don't use 'echo \\n', use printf"),
                 (r'echo -n', "don't use 'echo -n', use printf"),
                 (r'(^| )wc[^|]*$\n(?!.*\(re\))', "filter wc output"),
                 (r'head -c', "don't use 'head -c', use 'dd'"),
                 (r'sha1sum', "don't use sha1sum, use $TESTDIR/md5sum.py"),
                 (r'ls.*-\w*R', "don't use 'ls -R', use 'find'"),
                 (r'printf.*\\([1-9]|0\d)', "don't use 'printf \NNN', use Python"),
                 (r'printf.*\\x', "don't use printf \\x, use Python"),
                 (r'\$\(.*\)', "don't use $(expr), use `expr`"),
                 (r'rm -rf \*', "don't use naked rm -rf, target a directory"),
                 (r'(^|\|\s*)grep (-\w\s+)*[^|]*[(|]\w',
                  "use egrep for extended grep syntax"),
                 (r'/bin/', "don't use explicit paths for tools"),
                 (r'[^\n]\Z', "no trailing newline"),
                 (r'export.*=', "don't export and assign at once"),
                 (r'^source\b', "don't use 'source', use '.'"),
                 (r'touch -d', "don't use 'touch -d', use 'touch -t' instead"),
                 (r'ls +[^|\n-]+ +-', "options to 'ls' must come before filenames"),
                 (r'[^>\n]>\s*\$HGRCPATH', "don't overwrite $HGRCPATH, append to it"),
                 (r'^stop\(\)', "don't use 'stop' as a shell function name"),
                 (r'(\[|\btest\b).*-e ', "don't use 'test -e', use 'test -f'"),
                 (r'^alias\b.*=', "don't use alias, use a function"),
                 (r'if\s*!', "don't use '!' to negate exit status"),
                 (r'/dev/u?random', "don't use entropy, use /dev/zero"),
                 (r'do\s*true;\s*done', "don't use true as loop body, use sleep 0"),
                 (r'^( *)\t', "don't use tabs to indent"),
               ],
               # warnings
               [
                 (r'^function', "don't use 'function', use old style"),
                 (r'^diff.*-\w*N', "don't use 'diff -N'"),
                 (r'\$PWD|\${PWD}', "don't use $PWD, use `pwd`"),
                 (r'^([^"\'\n]|("[^"\n]*")|(\'[^\'\n]*\'))*\^', "^ must be quoted"),
                 (r'kill (`|\$\()', "don't use kill, use killdaemons.py")
               ]
             ]
             # Filters for the 'test script' check: (regex, replacement function)
             # pairs that checkfile() applies with re.sub to the file content before
             # the patterns above are searched. Here they mask comments (repcomment)
             # and here-document bodies (rephere).
             testfilters = [
                 (r"( *)(#([^\n]*\S)?)", repcomment),
                 (r"<<(\S+)((.|\n)*?\n\1)", rephere),
             ]
             # Message shared by the unified-test patterns about $TESTTMP paths.
             winglobmsg = "use (glob) to match Windows paths too"
             # Regex prefix matching the start of a command line ("  $ ") in a
             # unified test.
             uprefix = r"^  \$ "
             # Patterns for the 'unified test' check; same layout as the other
             # *pats tables: [always-applied patterns, warning-only patterns], each
             # entry (regex, message) or (regex, message, ignore-regex).
             utestpats = [
               [
                 (r'^(\S.*||  [$>] .*)[ \t]\n', "trailing whitespace on non-output"),
                 (uprefix + r'.*\|\s*sed[^|>\n]*\n',
                  "use regex test output patterns instead of sed"),
                 (uprefix + r'(true|exit 0)', "explicit zero exit unnecessary"),
                 (uprefix + r'.*(?<!\[)\$\?', "explicit exit code checks unnecessary"),
                 (uprefix + r'.*\|\| echo.*(fail|error)',
                  "explicit exit code checks unnecessary"),
                 (uprefix + r'set -e', "don't use set -e"),
                 (uprefix + r'\s', "don't indent commands, use > for continued lines"),
                 (r'^  saved backup bundle to \$TESTTMP.*\.hg$', winglobmsg),
                 (r'^  changeset .* references (corrupted|missing) \$TESTTMP/.*[^)]$',
                  winglobmsg),
                 (r'^  pulling from \$TESTTMP/.*[^)]$', winglobmsg, '\$TESTTMP/unix-repo$'),
               ],
               # warnings
               [
                 (r'^  [^*?/\n]* \(glob\)$',
                  "warning: glob match with no glob character (?*/)"),
               ]
             ]
             # Re-use every shell test pattern for unified tests by anchoring it to
             # lines that start with "  $ " or "  > ": a pattern that began with "^"
             # must match right after that prefix, any other pattern may match
             # anywhere later on the line. The loop variables i, p and m stay bound
             # at module level afterwards.
             for i in [0, 1]:
                 for p, m in testpats[i]:
                     if p.startswith(r'^'):
                         p = r"^  [$>] (%s)" % p[1:]
                     else:
                         p = r"^  [$>] .*(%s)" % p
                     utestpats[i].append((p, m))
             # Filters for the 'unified test' check: (regex, replacement function)
             # pairs applied with re.sub before pattern matching; they mask
             # here-document bodies (rephere) and comments (repcomment).
             utestfilters = [
                 (r"<<(\S+)((.|\n)*?\n  > \1)", rephere),
                 (r"( *)(#([^\n]*\S)?)", repcomment),
             ]
             # Patterns for the 'python' check. Same layout as the other *pats
             # tables: the first list is always applied by checkfile(), the second
             # (empty here) only when warnings are requested. Each entry is
             # (regex, message) or (regex, message, ignore-regex). The patterns are
             # searched in the file content after pyfilters has masked comments and
             # string literals.
             pypats = [
               [
                 (r'^\s*def\s*\w+\s*\(.*,\s*\(',
                  "tuple parameter unpacking not available in Python 3+"),
                 (r'lambda\s*\(.*,.*\)',
                  "tuple parameter unpacking not available in Python 3+"),
                 (r'(?<!def)\s+(cmp)\(', "cmp is not available in Python 3+"),
                 (r'\breduce\s*\(.*', "reduce is not available in Python 3+"),
                 (r'\.has_key\b', "dict.has_key is not available in Python 3+"),
                 (r'\s<>\s', '<> operator is not available in Python 3+, use !='),
                 (r'^\s*\t', "don't use tabs"),
                 (r'\S;\s*\n', "semicolon"),
                 (r'[^_]_\("[^"]+"\s*%', "don't use % inside _()"),
                 (r"[^_]_\('[^']+'\s*%", "don't use % inside _()"),
                 (r'(\w|\)),\w', "missing whitespace after ,"),
                 (r'(\w|\))[+/*\-<>]\w', "missing whitespace in expression"),
                 (r'^\s+(\w|\.)+=\w[^,()\n]*$', "missing whitespace in assignment"),
                 (r'(\s+)try:\n((?:\n|\1\s.*\n)+?)\1except.*?:\n'
                  r'((?:\n|\1\s.*\n)+?)\1finally:', 'no try/except/finally in Python 2.4'),
                 (r'(\s+)try:\n((?:\n|\1\s.*\n)*?)\1\s*yield\b.*?'
                  r'((?:\n|\1\s.*\n)+?)\1finally:',
                  'no yield inside try/finally in Python 2.4'),
                 (r'.{81}', "line too long"),
                 (r' x+[xo][\'"]\n\s+[\'"]x', 'string join across lines with no space'),
                 (r'[^\n]\Z', "no trailing newline"),
                 (r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),
             #    (r'^\s+[^_ \n][^_. \n]+_[^_\n]+\s*=',
             #     "don't use underbars in identifiers"),
                 # NOTE(review): the class [A-za-z] also matches the characters
                 # between "Z" and "a" ([ \ ] ^ _ `) -- confirm whether [A-Za-z]
                 # was intended before changing it.
                 (r'^\s+(self\.)?[A-za-z][a-z0-9]+[A-Z]\w* = ',
                  "don't use camelcase in identifiers"),
                 # NOTE(review): the tail "[^\\n]#\s]+" parses as a character
                 # class, a literal "#", whitespace and then one or more "]" --
                 # confirm the intended pattern.
                 (r'^\s*(if|while|def|class|except|try)\s[^[\n]*:\s*[^\\n]#\s]+',
                  "linebreak after :"),
                 (r'class\s[^( \n]+:', "old-style class, use class foo(object)"),
                 (r'class\s[^( \n]+\(\):',
                  "class foo() not available in Python 2.4, use class foo(object)"),
                 (r'\b(%s)\(' % '|'.join(keyword.kwlist),
                  "Python keyword is not a function"),
                 (r',]', "unneeded trailing ',' in list"),
             #    (r'class\s[A-Z][^\(]*\((?!Exception)',
             #     "don't capitalize non-exception classes"),
             #    (r'in range\(', "use xrange"),
             #    (r'^\s*print\s+', "avoid using print in core and extensions"),
                 (r'[\x80-\xff]', "non-ASCII character literal"),
                 # a character class, so that either kind of closing quote in
                 # front of .format( is caught
                 (r'["\']\.format\(', "str.format() not available in Python 2.4"),
                 (r'^\s*with\s+', "with not available in Python 2.4"),
                 (r'\.isdisjoint\(', "set.isdisjoint not available in Python 2.4"),
                 (r'^\s*except.* as .*:', "except as not available in Python 2.4"),
                 (r'^\s*os\.path\.relpath', "relpath not available in Python 2.4"),
                 (r'(?<!def)\s+(any|all|format)\(',
                  "any/all/format not available in Python 2.4"),
                 (r'(?<!def)\s+(callable)\(',
                  "callable not available in Python 3, use getattr(f, '__call__', None)"),
                 (r'if\s.*\selse', "if ... else form not available in Python 2.4"),
                 (r'^\s*(%s)\s\s' % '|'.join(keyword.kwlist),
                  "gratuitous whitespace after Python keyword"),
                 (r'([\(\[][ \t]\S)|(\S[ \t][\)\]])', "gratuitous whitespace in () or []"),
             #    (r'\s\s=', "gratuitous whitespace before ="),
                 (r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',
                  "missing whitespace around operator"),
                 (r'[^>< ](\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\s',
                  "missing whitespace around operator"),
                 (r'\s(\+=|-=|!=|<>|<=|>=|<<=|>>=|%=)\S',
                  "missing whitespace around operator"),
                 (r'[^^+=*/!<>&| %-](\s=|=\s)[^= ]',
                  "wrong whitespace around ="),
                 (r'raise Exception', "don't raise generic exceptions"),
                 (r'raise [^,(]+, (\([^\)]+\)|[^,\(\)]+)$',
                  "don't use old-style two-argument raise, use Exception(message)"),
                 (r' is\s+(not\s+)?["\'0-9-]', "object comparison with literal"),
                 (r' [=!]=\s+(True|False|None)',
                  "comparison with singleton, use 'is' or 'is not' instead"),
                 (r'^\s*(while|if) [01]:',
                  "use True/False for constant Boolean expression"),
                 (r'(?:(?<!def)\s+|\()hasattr',
                  'hasattr(foo, bar) is broken, use util.safehasattr(foo, bar) instead'),
                 (r'opener\([^)]*\).read\(',
                  "use opener.read() instead"),
                 (r'BaseException', 'not in Python 2.4, use Exception'),
                 (r'os\.path\.relpath', 'os.path.relpath is not in Python 2.5'),
                 (r'opener\([^)]*\).write\(',
                  "use opener.write() instead"),
                 (r'[\s\(](open|file)\([^)]*\)\.read\(',
                  "use util.readfile() instead"),
                 # the write rule points at the write helper, not the read one
                 (r'[\s\(](open|file)\([^)]*\)\.write\(',
                  "use util.writefile() instead"),
                 (r'^[\s\(]*(open(er)?|file)\([^)]*\)',
                  "always assign an opened file to a variable, and close it afterwards"),
                 (r'[\s\(](open|file)\([^)]*\)\.',
                  "always assign an opened file to a variable, and close it afterwards"),
                 (r'(?i)descendent', "the proper spelling is descendAnt"),
                 (r'\.debug\(\_', "don't mark debug messages for translation"),
                 (r'\.strip\(\)\.split\(\)', "no need to strip before splitting"),
                 (r'^\s*except\s*:', "naked except clause", r'#.*re-raises'),
                 (r':\n(    )*( ){1,3}[^ ]', "must indent 4 spaces"),
                 (r'ui\.(status|progress|write|note|warn)\([\'\"]x',
                  "missing _() in ui message (use () to hide false-positives)"),
               ],
               # warnings
               [
               ]
             ]
             # Filters for the Python checks: one (regex, replacement function) pair
             # that checkfile() applies with re.sub before pattern matching. The
             # verbose regex matches either a comment (group 'comment') or a string
             # literal delimited by ''', """, ' or " (groups 'quote' and 'text');
             # reppython masks whichever one matched.
             pyfilters = [
                 (r"""(?msx)(?P<comment>\#.*?$)|
                      ((?P<quote>('''|\"\"\"|(?<!')'(?!')|(?<!")"(?!")))
                       (?P<text>(([^\\]|\\.)*?))
                       (?P=quote))""", reppython),
             ]
+            txtfilters = []
+            txtpats = [
+              [
+                ('\s$', 'trailing whitespace'),
+              ],
+              []
+            ]
             # Patterns for the 'c' check. Same layout as the other *pats tables:
             # [always-applied patterns, warning-only patterns], each entry
             # (regex, message).
             cpats = [
               [
                 (r'//', "don't use //-style comments"),
                 (r'^  ', "don't use spaces to indent"),
                 (r'\S\t', "don't use tabs except for indent"),
                 (r'(\S[ \t]+|^[ \t]+)\n', "trailing whitespace"),
                 (r'.{81}', "line too long"),
                 (r'(while|if|do|for)\(', "use space after while/if/do/for"),
                 (r'return\(', "return is not a function"),
                 (r' ;', "no space before ;"),
                 (r'\w+\* \w+', "use int *foo, not int* foo"),
                 (r'\([^\)]+\) \w+', "use (int)foo, not (int) foo"),
                 (r'\w+ (\+\+|--)', "use foo++, not foo ++"),
                 (r'\w,\w', "missing whitespace after ,"),
                 (r'^[^#]\w[+/*]\w', "missing whitespace in expression"),
                 (r'^#\s+\w', "use #foo, not # foo"),
                 (r'[^\n]\Z', "no trailing newline"),
                 (r'^\s*#import\b', "use only #include in standard C code"),
               ],
               # warnings
               []
             ]
             # Filters for the 'c' check: (regex, replacement function) pairs applied
             # with re.sub, in this order, before pattern matching. They mask
             # /* */ comments, double-quoted strings and #include <...> targets, and
             # strip whitespace after newlines inside parentheses.
             cfilters = [
                 (r'(/\*)(((\*(?!/))|[^*])*)\*/', repccomment),
                 (r'''(?P<quote>(?<!")")(?P<text>([^"]|\\")+)"(?!")''', repquote),
                 (r'''(#\s*include\s+<)([^>]+)>''', repinclude),
                 (r'(\()([^)]+\))', repcallspaces),
             ]
             # Patterns for the 'layering violation ui in util' check, which the
             # checks table applies to mercurial/util.py: flags any use of "ui.".
             # Layout: [always-applied patterns, warning-only patterns].
             inutilpats = [
               [
                 (r'\bui\.', "don't use ui in util"),
               ],
               # warnings
               []
             ]
             # Patterns for the 'layering violation repo in revlog' check, which the
             # checks table applies to mercurial/revlog.py: flags any use of "repo.".
             inrevlogpats = [
               [
                 (r'\brepo\.', "don't use repo in revlog"),
               ],
               # warnings
               []
             ]
             # Table of checks run by checkfile(). Each entry is
             # (check name, filename regex, filters, patterns): a check applies to a
             # file when the regex matches its path (re.match, so anchored at the
             # start), the filters are applied to the content first, then the
             # patterns are searched. A file may be covered by several checks.
             checks = [
                 ('python', r'.*\.(py|cgi)$', pyfilters, pypats),
                 ('test script', r'(.*/)?test-[^.~]*$', testfilters, testpats),
                 ('c', r'.*\.c$', cfilters, cpats),
                 ('unified test', r'.*\.t$', utestfilters, utestpats),
                 ('layering violation repo in revlog', r'mercurial/revlog\.py', pyfilters,
                  inrevlogpats),
                 ('layering violation ui in util', r'mercurial/util\.py', pyfilters,
                  inutilpats),
                 ('txt', r'.*\.txt$', txtfilters, txtpats),
             ]
             class norepeatlogger(object):
                 def __init__(self):
                     self._lastseen = None
                 def log(self, fname, lineno, line, msg, blame):
                     """print error related a to given line of a given file.
                     The faulty line will also be printed but only once in the case
                     of multiple errors.
                     :fname: filename
                     :lineno: line number
                     :line: actual content of the line
                     :msg: error message
                     """
                     msgid = fname, lineno, line
                     if msgid != self._lastseen:
                         if blame:
                             print "%s:%d (%s):" % (fname, lineno, blame)
                         else:
                             print "%s:%d:" % (fname, lineno)
                         print " > %s" % line
                         self._lastseen = msgid
                     print " " + msg
             _defaultlogger = norepeatlogger()
             def getblame(f):
                 """Return annotate information for every line of file f.

                 Runs "hg annotate -un" on f and parses each output line: the part
                 before the first ":" must consist of exactly two
                 whitespace-separated fields, taken as user and revision; the rest,
                 minus its first and last character (presumably the separating space
                 and the newline), is the line content.

                 :f: path of the file to annotate

                 return a list of (line content, user, revision) tuples in output
                 order; the list is empty when hg produces no output or cannot be
                 started. A ValueError is raised when an output line does not have
                 the expected form.
                 """
                 # imported here so the block does not depend on a new file-level
                 # import
                 import subprocess
                 try:
                     # the file name is passed as its own argument, without a shell,
                     # so spaces and shell metacharacters in f are harmless
                     proc = subprocess.Popen(['hg', 'annotate', '-un', f],
                                             stdout=subprocess.PIPE)
                 except OSError:
                     # hg could not be started; the shell-based version produced
                     # no lines in that case either
                     return []
                 lines = []
                 try:
                     for l in proc.stdout:
                         start, line = l.split(':', 1)
                         user, rev = start.split()
                         lines.append((line[1:-1], user, rev))
                 finally:
                     # always release the pipe and reap the child process
                     proc.stdout.close()
                     proc.wait()
                 return lines
             def checkfile(f, logfunc=_defaultlogger.log, maxerr=None, warnings=False,
                           blame=False, debug=False, lineno=True):
                 """checks style and portability of a given file
                 :f: filepath
                 :logfunc: function used to report error
                           logfunc(filename, linenumber, linecontent, errormessage)
                 :maxerr: number of error to display before aborting.
                          Set to false (default) to report all errors
                 return True if no error is found, False otherwise.
                 """
                 blamecache = None
                 result = True
                 for name, match, filters, pats in checks:
                     if debug:
                         print name, f
                     fc = 0
                     if not re.match(match, f):
                         if debug:
                             print "Skipping %s for %s it doesn't match %s" % (
                                    name, match, f)
                         continue
                     fp = open(f)
                     pre = post = fp.read()
                     fp.close()
                     if "no-" + "check-code" in pre:
                         if debug:
                             print "Skipping %s for %s it has no- and check-code" % (
                                    name, f)
                         break
                     for p, r in filters:
                         post = re.sub(p, r, post)
                     if warnings:
                         pats = pats[0] + pats[1]
                     else:
                         pats = pats[0]
                     # print post # uncomment to show filtered version
                     if debug:
                         print "Checking %s for %s" % (name, f)
                     prelines = None
                     errors = []
                     for pat in pats:
                         if len(pat) == 3:
                             p, msg, ignore = pat
                         else:
                             p, msg = pat
                             ignore = None
                         # fix-up regexes for multi-line searches
                         po = p
                         # \s doesn't match \n
                         p = re.sub(r'(?<!\\)\\s', r'[ \\t]', p)
                         # [^...] doesn't match newline
                         p = re.sub(r'(?<!\\)\[\^', r'[^\\n', p)
                         #print po, '=>', p
                         pos = 0
                         n = 0
                         for m in re.finditer(p, post, re.MULTILINE):
                             if prelines is None:
                                 prelines = pre.splitlines()
                                 postlines = post.splitlines(True)
                             start = m.start()
                             while n < len(postlines):
                                 step = len(postlines[n])
                                 if pos + step > start:
                                     break
                                 pos += step
                                 n += 1
                             l = prelines[n]
                             if "check-code" + "-ignore" in l:
                                 if debug:
                                     print "Skipping %s for %s:%s (check-code -ignore)" % (
                                         name, f, n)
                                 continue
                             elif ignore and re.search(ignore, l, re.MULTILINE):
                                 continue
                             bd = ""
                             if blame:
                                 bd = 'working directory'
                                 if not blamecache:
                                     blamecache = getblame(f)
                                 if n < len(blamecache):
                                     bl, bu, br = blamecache[n]
                                     if bl == l:
                                         bd = '%s@%s' % (bu, br)
                             errors.append((f, lineno and n + 1, l, msg, bd))
                             result = False
                     errors.sort()
                     for e in errors:
                         logfunc(*e)
                         fc += 1
                         if maxerr and fc >= maxerr:
                             print " (too many errors, giving up)"
                             break
                 return result
             if __name__ == "__main__":
                 # Command-line entry point: run checkfile() on every file given as
                 # argument and exit with status 1 when any of them has an error.
                 parser = optparse.OptionParser("%prog [options] [files]")
                 parser.add_option(
                     "-w", "--warnings", action="store_true",
                     help="include warning-level checks")
                 parser.add_option(
                     "-p", "--per-file", type="int",
                     help="max warnings per file")
                 parser.add_option(
                     "-b", "--blame", action="store_true",
                     help="use annotate to generate blame info")
                 parser.add_option(
                     "", "--debug", action="store_true",
                     help="show debug information")
                 parser.add_option(
                     "", "--nolineno", action="store_false", dest='lineno',
                     help="don't show line numbers")

                 parser.set_defaults(per_file=15, warnings=False, blame=False,
                                     debug=False, lineno=True)
                 options, args = parser.parse_args()

                 # without file arguments, check everything matching "*" in the
                 # current directory
                 check = args or glob.glob("*")

                 ret = 0
                 for f in check:
                     clean = checkfile(f, maxerr=options.per_file,
                                       warnings=options.warnings,
                                       blame=options.blame, debug=options.debug,
                                       lineno=options.lineno)
                     if not clean:
                         ret = 1
                 sys.exit(ret)