upstream/mercurial-mirror Commit - r38039:2f406142

1

# match.py - filename matching

1

# match.py - filename matching

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import, print_function

8

from __future__ import absolute_import, print_function

9

10

import copy

10

import copy

11

import os

11

import os

12

import re

12

import re

13

14

from .i18n import _

14

from .i18n import _

15

from . import (

15

from . import (

16

encoding,

16

encoding,

17

error,

17

error,

18

pathutil,

18

pathutil,

19

pycompat,

19

pycompat,

20

util,

20

util,

21

)

21

)

22

from .utils import (

22

from .utils import (

23

stringutil,

23

stringutil,

24

)

24

)

25

26

# Names of the pattern kinds (the 'kind' in 'kind:pattern') known to this
# module.
allpatternkinds = (
    're', 'glob', 'path', 'relglob', 'relpath', 'relre',
    'listfile', 'listfile0', 'set', 'include', 'subinclude',
    'rootfilesin',
)

# Kinds whose pattern text is canonicalized relative to the current working
# directory (see _donormalize()).
cwdrelativepatternkinds = ('relpath', 'glob')

# Local alias so the matcher classes can write @propertycache.
propertycache = util.propertycache

32

33

def _rematcher(regex):
    '''compile the regexp with the best available regexp engine and return a
    matcher function

    The pattern is compiled through util.re. If the compiled object exposes
    a test_match attribute, that is returned; otherwise its match method is
    returned.
    '''
    m = util.re.compile(regex)
    try:
        # slightly faster, provided by facebook's re2 bindings
        return m.test_match
    except AttributeError:
        return m.match

42

43

def _expandsets(kindpats, ctx, listsubrepos):
    '''Returns the kindpats list with the 'set' patterns expanded.

    The result is a (fset, other) pair:

    fset  - set of the names yielded by ctx.getfileset(pat) for every
            'set' pattern; when listsubrepos is true, every subrepo path in
            ctx.substate is queried as well and its results are added
            prefixed with 'subpath/'
    other - the (kind, pat, source) tuples of all other kinds, in their
            original order

    Raises error.ProgrammingError if a 'set' pattern is found while ctx is
    false.
    '''
    fset = set()
    other = []

    for kind, pat, source in kindpats:
        if kind == 'set':
            if not ctx:
                raise error.ProgrammingError("fileset expression with no "
                                             "context")
            s = ctx.getfileset(pat)
            fset.update(s)

            if listsubrepos:
                for subpath in ctx.substate:
                    s = ctx.sub(subpath).getfileset(pat)
                    fset.update(subpath + '/' + f for f in s)

            continue
        other.append((kind, pat, source))
    return fset, other

64

65

def _expandsubinclude(kindpats, root):
    '''Returns the list of subinclude matcher args and the kindpats without the
    subincludes in it.

    The result is a (relmatchers, other) pair. For every 'subinclude'
    pattern, relmatchers receives a (prefix, matcherargs) tuple where
    matcherargs is (newroot, '', [], ['include:<path>']), <path> being the
    pattern joined onto the directory of its source file and newroot the
    directory of <path>. prefix is newroot canonicalized against root, with
    a trailing '/' appended when it is not empty. All other
    (kind, pat, source) tuples are returned unchanged in other.
    '''
    relmatchers = []
    other = []

    for kind, pat, source in kindpats:
        if kind == 'subinclude':
            # The subinclude path is relative to the file that named it.
            sourceroot = pathutil.dirname(util.normpath(source))
            pat = util.pconvert(pat)
            path = pathutil.join(sourceroot, pat)

            newroot = pathutil.dirname(path)
            matcherargs = (newroot, '', [], ['include:%s' % path])

            prefix = pathutil.canonpath(root, root, newroot)
            if prefix:
                prefix += '/'
            relmatchers.append((prefix, matcherargs))
        else:
            other.append((kind, pat, source))

    return relmatchers, other

88

89

def _kindpatsalwaysmatch(kindpats):
    """Checks whether the kindpats match everything, as e.g.
    'relpath:.' does.

    Returns True only if every (kind, pat, source) tuple has an empty
    pattern and a kind of 'relpath' or 'glob'. An empty kindpats list
    therefore also yields True.
    """
    for kind, pat, source in kindpats:
        if pat != '' or kind not in ['relpath', 'glob']:
            return False
    return True

97

98

def match(root, cwd, patterns=None, include=None, exclude=None, default='glob',
          exact=False, auditor=None, ctx=None, listsubrepos=False, warn=None,
          badfn=None, icasefs=False):
    """build an object to match a set of file patterns

    arguments:
    root - the canonical root of the tree you're matching against
    cwd - the current working directory, if relevant
    patterns - patterns to find
    include - patterns to include (unless they are excluded)
    exclude - patterns to exclude (even if they are included)
    default - if a pattern in patterns has no explicit type, assume this one
    exact - patterns are actually filenames (include/exclude still apply)
    auditor - optional object handed to pathutil.canonpath() while
              cwd-relative patterns are normalized
    ctx - optional context handed to the pattern/include matchers; required
          (its repo's dirstate is used) when icasefs is true
    listsubrepos - handed to the pattern/include matchers together with ctx
    warn - optional function used for printing warnings
    badfn - optional bad() callback for this matcher instead of the default
    icasefs - make a matcher for wdir on case insensitive filesystems, which
              normalizes the given patterns to the case in the filesystem

    a pattern is one of:
    'glob:<glob>' - a glob relative to cwd
    're:<regexp>' - a regular expression
    'path:<path>' - a path relative to repository root, which is matched
                    recursively
    'rootfilesin:<path>' - a path relative to repository root, which is
                    matched non-recursively (will not match subdirectories)
    'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
    'relpath:<path>' - a path relative to cwd
    'relre:<regexp>' - a regexp that needn't match the start of a name
    'set:<fileset>' - a fileset expression
    'include:<path>' - a file of patterns to read and include
    'subinclude:<path>' - a file of patterns to match against files under
                          the same directory
    '<something>' - a pattern of the specified default type

    Raises error.ProgrammingError when both exact and icasefs are requested.
    """
    normalize = _donormalize
    if icasefs:
        if exact:
            raise error.ProgrammingError("a case-insensitive exact matcher "
                                         "doesn't make sense")
        dirstate = ctx.repo().dirstate
        dsnormalize = dirstate.normalize

        def normalize(patterns, default, root, cwd, auditor, warn):
            # Same as _donormalize(), but additionally folds every
            # non-regex pattern through the dirstate's normalize().
            kp = _donormalize(patterns, default, root, cwd, auditor, warn)
            kindpats = []
            for kind, pats, source in kp:
                if kind not in ('re', 'relre'):  # regex can't be normalized
                    p = pats
                    pats = dsnormalize(pats)

                    # Preserve the original to handle a case only rename.
                    if p != pats and p in dirstate:
                        kindpats.append((kind, p, source))

                kindpats.append((kind, pats, source))
            return kindpats

    if exact:
        m = exactmatcher(root, cwd, patterns, badfn)
    elif patterns:
        kindpats = normalize(patterns, default, root, cwd, auditor, warn)
        if _kindpatsalwaysmatch(kindpats):
            m = alwaysmatcher(root, cwd, badfn, relativeuipath=True)
        else:
            m = patternmatcher(root, cwd, kindpats, ctx=ctx,
                               listsubrepos=listsubrepos, badfn=badfn)
    else:
        # It's a little strange that no patterns means to match everything.
        # Consider changing this to match nothing (probably using nevermatcher).
        m = alwaysmatcher(root, cwd, badfn)

    # include/exclude are always parsed with 'glob' as the default kind and
    # never receive the caller's badfn.
    if include:
        kindpats = normalize(include, 'glob', root, cwd, auditor, warn)
        im = includematcher(root, cwd, kindpats, ctx=ctx,
                            listsubrepos=listsubrepos, badfn=None)
        m = intersectmatchers(m, im)
    if exclude:
        kindpats = normalize(exclude, 'glob', root, cwd, auditor, warn)
        em = includematcher(root, cwd, kindpats, ctx=ctx,
                            listsubrepos=listsubrepos, badfn=None)
        m = differencematcher(m, em)
    return m

180

181

def exact(root, cwd, files, badfn=None):
    '''Return an exactmatcher for the given list of files.'''
    return exactmatcher(root, cwd, files, badfn=badfn)

183

184

def always(root, cwd):
    '''Return an alwaysmatcher for the given root and cwd.'''
    return alwaysmatcher(root, cwd)

186

187

def never(root, cwd):
    '''Return a nevermatcher for the given root and cwd.'''
    return nevermatcher(root, cwd)

189

190

def badmatch(match, badfn):
    """Make a copy of the given matcher, replacing its bad method with the given
    one.

    The copy is shallow (copy.copy), and the matcher passed in is left
    untouched.
    """
    m = copy.copy(match)
    m.bad = badfn
    return m

197

198

def _donormalize(patterns, default, root, cwd, auditor, warn):
    '''Convert 'kind:pat' from the patterns list to tuples with kind and
    normalized and rooted patterns and with listfiles expanded.

    Returns a list of (kind, pat, source) tuples. source is '' for patterns
    given directly, the list file name for patterns read through
    'listfile:'/'listfile0:', and the include file (or the source reported
    by the nested expansion) for patterns read through 'include:'.

    Raises error.Abort if a list file cannot be read or if expanding an
    include file aborts. An unreadable include file is skipped, with a
    message passed to warn if one was given.
    '''
    kindpats = []
    for kind, pat in [_patsplit(p, default) for p in patterns]:
        if kind in cwdrelativepatternkinds:
            pat = pathutil.canonpath(root, cwd, pat, auditor)
        elif kind in ('relglob', 'path', 'rootfilesin'):
            pat = util.normpath(pat)
        elif kind in ('listfile', 'listfile0'):
            try:
                files = util.readfile(pat)
                if kind == 'listfile0':
                    files = files.split('\0')
                else:
                    files = files.splitlines()
                files = [f for f in files if f]
            except EnvironmentError:
                raise error.Abort(_("unable to read file list (%s)") % pat)
            for k, p, source in _donormalize(files, default, root, cwd,
                                             auditor, warn):
                kindpats.append((k, p, pat))
            continue
        elif kind == 'include':
            try:
                fullpath = os.path.join(root, util.localpath(pat))
                includepats = readpatternfile(fullpath, warn)
                for k, p, source in _donormalize(includepats, default,
                                                 root, cwd, auditor, warn):
                    kindpats.append((k, p, source or pat))
            except error.Abort as inst:
                # Exception instances are not subscriptable on Python 3;
                # args[0] works on both Python 2 and 3.
                raise error.Abort('%s: %s' % (pat, inst.args[0]))
            except IOError as inst:
                if warn:
                    warn(_("skipping unreadable pattern file '%s': %s\n") %
                         (pat, stringutil.forcebytestr(inst.strerror)))
            continue
        # else: re or relre - which cannot be normalized
        kindpats.append((kind, pat, ''))
    return kindpats

238

239

class basematcher(object):
    '''Common base of the matcher classes.

    On its own it matches nothing (matchfn() returns False) and lists no
    files; subclasses override matchfn(), _files, visitdir() and the
    always()/isexact()/prefix() predicates as needed.
    '''

    def __init__(self, root, cwd, badfn=None, relativeuipath=True):
        self._root = root
        self._cwd = cwd
        # Only shadow the bad() method when a callback was actually given.
        if badfn is not None:
            self.bad = badfn
        self._relativeuipath = relativeuipath

    def __call__(self, fn):
        '''Return whether fn matches, as decided by matchfn().'''
        return self.matchfn(fn)

    def __iter__(self):
        '''Iterate over the entries of files().'''
        for f in self._files:
            yield f

    # Callbacks related to how the matcher is used by dirstate.walk.
    # Subscribers to these events must monkeypatch the matcher object.
    def bad(self, f, msg):
        '''Callback from dirstate.walk for each explicit file that can't be
        found/accessed, with an error message.'''

    # If an explicitdir is set, it will be called when an explicitly listed
    # directory is visited.
    explicitdir = None

    # If a traversedir is set, it will be called when a directory discovered
    # by recursive traversal is visited.
    traversedir = None

    def abs(self, f):
        '''Convert a repo path back to path that is relative to the root of the
        matcher.'''
        return f

    def rel(self, f):
        '''Convert repo path back to path that is relative to cwd of matcher.'''
        return util.pathto(self._root, self._cwd, f)

    def uipath(self, f):
        '''Convert repo path to a display path.  If patterns or -I/-X were used
        to create this matcher, the display path will be relative to cwd.
        Otherwise it is relative to the root of the repo.'''
        # Note: an empty rel(f) also falls through to abs(f).
        return (self._relativeuipath and self.rel(f)) or self.abs(f)

    @propertycache
    def _files(self):
        return []

    def files(self):
        '''Explicitly listed files or patterns or roots:
        if no patterns or .always(): empty list,
        if exact: list exact files,
        if not .anypats(): list all files and dirs,
        else: optimal roots'''
        return self._files

    @propertycache
    def _fileset(self):
        return set(self._files)

    def exact(self, f):
        '''Returns True if f is in .files().'''
        return f in self._fileset

    def matchfn(self, f):
        '''Return whether f matches; the base implementation never does.'''
        return False

    def visitdir(self, dir):
        '''Decides whether a directory should be visited based on whether it
        has potential matches in it or one of its subdirectories. This is
        based on the match's primary, included, and excluded patterns.

        Returns the string 'all' if the given directory and all subdirectories
        should be visited. Otherwise returns True or False indicating whether
        the given directory should be visited.
        '''
        return True

    def always(self):
        '''Matcher will match everything and .files() will be empty --
        optimization might be possible.'''
        return False

    def isexact(self):
        '''Matcher will match exactly the list of files in .files() --
        optimization might be possible.'''
        return False

    def prefix(self):
        '''Matcher will match the paths in .files() recursively --
        optimization might be possible.'''
        return False

    def anypats(self):
        '''None of .always(), .isexact(), and .prefix() is true --
        optimizations will be difficult.'''
        return not self.always() and not self.isexact() and not self.prefix()

335

336

class alwaysmatcher(basematcher):
    '''Matches everything.'''

    def __init__(self, root, cwd, badfn=None, relativeuipath=False):
        # Unlike basematcher, relativeuipath defaults to False here.
        super(alwaysmatcher, self).__init__(root, cwd, badfn,
                                            relativeuipath=relativeuipath)

    def always(self):
        return True

    def matchfn(self, f):
        return True

    def visitdir(self, dir):
        # Every directory and all of its subdirectories are to be visited.
        return 'all'

    def __repr__(self):
        return r'<alwaysmatcher>'

354

355

class nevermatcher(basematcher):
    '''Matches nothing.'''

    def __init__(self, root, cwd, badfn=None):
        super(nevermatcher, self).__init__(root, cwd, badfn)

    # It's a little weird to say that the nevermatcher is an exact matcher
    # or a prefix matcher, but it seems to make sense to let callers take
    # fast paths based on either. There will be no exact matches, nor any
    # prefixes (files() returns []), so fast paths iterating over them should
    # be efficient (and correct).
    def isexact(self):
        return True

    def prefix(self):
        return True

    def visitdir(self, dir):
        # Nothing can match, so no directory needs to be visited.
        return False

    def __repr__(self):
        return r'<nevermatcher>'

377

378

class patternmatcher(basematcher):
    '''Matches files against a list of (kind, pat, source) patterns.

    files() is computed by _explicitfiles(), prefix() by _prefix(), and the
    match function is built by _buildmatch() with '$' as the pattern suffix.
    '''

    def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                 badfn=None):
        super(patternmatcher, self).__init__(root, cwd, badfn)

        self._files = _explicitfiles(kindpats)
        self._prefix = _prefix(kindpats)
        self._pats, self.matchfn = _buildmatch(ctx, kindpats, '$', listsubrepos,
                                               root)

    @propertycache
    def _dirs(self):
        # The directories reported by util.dirs() for the listed files,
        # plus '.'.
        return set(util.dirs(self._fileset)) | {'.'}

    def visitdir(self, dir):
        if self._prefix and dir in self._fileset:
            return 'all'
        return ('.' in self._fileset or
                dir in self._fileset or
                dir in self._dirs or
                any(parentdir in self._fileset
                    for parentdir in util.finddirs(dir)))

    def prefix(self):
        return self._prefix

    @encoding.strmethod
    def __repr__(self):
        return ('<patternmatcher patterns=%r>' % pycompat.bytestr(self._pats))

408

409

class includematcher(basematcher):
    '''Matches files against a list of include (kind, pat, source) patterns.

    The match function is built by _buildmatch() with '(?:/|$)' as the
    pattern suffix; visitdir() is answered from the roots and dirs computed
    by _rootsanddirs().
    '''

    def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                 badfn=None):
        super(includematcher, self).__init__(root, cwd, badfn)

        self._pats, self.matchfn = _buildmatch(ctx, kindpats, '(?:/|$)',
                                               listsubrepos, root)
        self._prefix = _prefix(kindpats)
        roots, dirs = _rootsanddirs(kindpats)
        # roots are directories which are recursively included.
        self._roots = set(roots)
        # dirs are directories which are non-recursively included.
        self._dirs = set(dirs)

    def visitdir(self, dir):
        if self._prefix and dir in self._roots:
            return 'all'
        return ('.' in self._roots or
                dir in self._roots or
                dir in self._dirs or
                any(parentdir in self._roots
                    for parentdir in util.finddirs(dir)))

    @encoding.strmethod
    def __repr__(self):
        return ('<includematcher includes=%r>' % pycompat.bytestr(self._pats))

436

437

class exactmatcher(basematcher):
    '''Matches the input files exactly. They are interpreted as paths, not
    patterns (so no kind-prefixes).
    '''

    def __init__(self, root, cwd, files, badfn=None):
        super(exactmatcher, self).__init__(root, cwd, badfn)

        # A list is stored as given (not copied); any other iterable is
        # materialized into a list.
        if isinstance(files, list):
            self._files = files
        else:
            self._files = list(files)

    # Matching is plain membership in files().
    matchfn = basematcher.exact

    @propertycache
    def _dirs(self):
        # The directories reported by util.dirs() for the listed files,
        # plus '.'.
        return set(util.dirs(self._fileset)) | {'.'}

    def visitdir(self, dir):
        return dir in self._dirs

    def isexact(self):
        return True

    @encoding.strmethod
    def __repr__(self):
        return ('<exactmatcher files=%r>' % self._files)

465

466

class differencematcher(basematcher):
    '''Composes two matchers by matching if the first matches and the second
    does not.

    The second matcher's non-matching-attributes (root, cwd, bad, explicitdir,
    traversedir) are ignored.
    '''
    def __init__(self, m1, m2):
        super(differencematcher, self).__init__(m1._root, m1._cwd)
        self._m1 = m1
        self._m2 = m2
        # The callbacks are taken from the first matcher only.
        self.bad = m1.bad
        self.explicitdir = m1.explicitdir
        self.traversedir = m1.traversedir

    def matchfn(self, f):
        return self._m1(f) and not self._m2(f)

    @propertycache
    def _files(self):
        if self.isexact():
            return [f for f in self._m1.files() if self(f)]
        # If m1 is not an exact matcher, we can't easily figure out the set of
        # files, because its files() are not always files. For example, if
        # m1 is "path:dir" and m2 is "rootfilesin:.", we don't
        # want to remove "dir" from the set even though it would match m2,
        # because the "dir" in m1 may not be a file.
        return self._m1.files()

    def visitdir(self, dir):
        # If m2 matches everything under dir, nothing there can survive the
        # difference.
        if self._m2.visitdir(dir) == 'all':
            return False
        # m1 may answer 'all'; that is collapsed to a plain boolean here.
        return bool(self._m1.visitdir(dir))

    def isexact(self):
        return self._m1.isexact()

    @encoding.strmethod
    def __repr__(self):
        return ('<differencematcher m1=%r, m2=%r>' % (self._m1, self._m2))

506

507

def intersectmatchers(m1, m2):
    '''Build a matcher that matches only when both m1 and m2 match.

    The non-matching attributes of the second matcher (root, cwd, bad,
    explicitdir, traversedir) are ignored.

    Shortcuts taken before building an intersectionmatcher:

    - if either argument is None, ``m1 or m2`` is returned;
    - if m1 always matches, a shallow copy of m2 carrying m1's bad,
      explicitdir, traversedir, abs and rel is returned;
    - if m2 always matches, a shallow copy of m1 is returned.

    In both copy cases the ``_relativeuipath`` flags are OR-ed together.
    '''
    if m1 is None or m2 is None:
        return m1 or m2

    if not m1.always():
        if not m2.always():
            return intersectionmatcher(m1, m2)
        # m2 adds no restriction: m1 alone decides
        result = copy.copy(m1)
        result._relativeuipath |= m2._relativeuipath
        return result

    # m1 adds no restriction: m2 decides, but m1's callbacks are kept
    result = copy.copy(m2)
    # TODO: Consider encapsulating these things in a class so there's only
    # one thing to copy from m1.
    result.bad = m1.bad
    result.explicitdir = m1.explicitdir
    result.traversedir = m1.traversedir
    result.abs = m1.abs
    result.rel = m1.rel
    result._relativeuipath |= m1._relativeuipath
    return result

531

532

class intersectionmatcher(basematcher):
    '''Matcher accepting only what both m1 and m2 accept.

    root, cwd, bad, explicitdir and traversedir are taken from m1.
    '''
    def __init__(self, m1, m2):
        super(intersectionmatcher, self).__init__(m1._root, m1._cwd)
        self._m1, self._m2 = m1, m2
        # callbacks always come from the first matcher
        self.traversedir = m1.traversedir
        self.explicitdir = m1.explicitdir
        self.bad = m1.bad

    @propertycache
    def _files(self):
        if not self.isexact():
            # If neither m1 nor m2 is an exact matcher, the file lists
            # cannot simply be intersected, because files() entries are
            # not always files.  For example, when intersecting a matcher
            # "-I glob:foo.txt" with a matcher of "path:dir2", "dir2"
            # must not be removed from the set.
            return self._m1.files() + self._m2.files()
        # enumerate the exact side and filter it through the other one
        if self._m1.isexact():
            exact, other = self._m1, self._m2
        else:
            exact, other = self._m2, self._m1
        return [name for name in exact.files() if other(name)]

    def matchfn(self, f):
        '''Match ``f`` only when both matchers match it.'''
        first = self._m1(f)
        if not first:
            return first
        return self._m2(f)

    def visitdir(self, dir):
        visit1 = self._m1.visitdir(dir)
        if visit1 == 'all':
            # m1 takes everything below dir, so m2 alone decides
            return self._m2.visitdir(dir)
        if not visit1:
            return False
        # bool() because visit1=True + visit2='all' should not be 'all'
        return bool(self._m2.visitdir(dir))

    def always(self):
        '''Always-matching only if both operands are.'''
        return self._m1.always() and self._m2.always()

    def isexact(self):
        '''Exact as soon as one operand is exact.'''
        return self._m1.isexact() or self._m2.isexact()

    @encoding.strmethod
    def __repr__(self):
        operands = (self._m1, self._m2)
        return '<intersectionmatcher m1=%r, m2=%r>' % operands

573

574

class subdirmatcher(basematcher):
    """Restrict an existing matcher to a single subdirectory.

    Paths handed to this matcher are relative to the subdirectory; the
    subdirectory path is inserted or removed as needed when talking to
    the wrapped matcher:

    >>> from . import pycompat
    >>> m1 = match(b'root', b'', [b'a.txt', b'sub/b.txt'])
    >>> m2 = subdirmatcher(b'sub', m1)
    >>> bool(m2(b'a.txt'))
    False
    >>> bool(m2(b'b.txt'))
    True
    >>> bool(m2.matchfn(b'a.txt'))
    False
    >>> bool(m2.matchfn(b'b.txt'))
    True
    >>> m2.files()
    ['b.txt']
    >>> m2.exact(b'b.txt')
    True
    >>> util.pconvert(m2.rel(b'b.txt'))
    'sub/b.txt'
    >>> def bad(f, msg):
    ...     print(pycompat.sysstr(b"%s: %s" % (f, msg)))
    >>> m1.bad = bad
    >>> m2.bad(b'x.txt', b'No such file')
    sub/x.txt: No such file
    >>> m2.abs(b'c.txt')
    'sub/c.txt'
    """

    def __init__(self, path, matcher):
        super(subdirmatcher, self).__init__(matcher._root, matcher._cwd)
        self._path = path
        self._matcher = matcher
        self._always = matcher.always()

        # keep the parent's files that live below path, made relative
        inside = path + "/"
        cut = len(path) + 1
        self._files = [name[cut:] for name in matcher._files
                       if name.startswith(inside)]

        # If the parent repo had a path to this subrepo and the matcher is
        # a prefix matcher, this submatcher always matches.
        if matcher.prefix():
            self._always = any(name == path for name in matcher._files)

    def bad(self, f, msg):
        '''Forward to the wrapped matcher's bad() with the full path.'''
        full = self._path + "/" + f
        self._matcher.bad(full, msg)

    def abs(self, f):
        full = self._path + "/" + f
        return self._matcher.abs(full)

    def rel(self, f):
        full = self._path + "/" + f
        return self._matcher.rel(full)

    def uipath(self, f):
        full = self._path + "/" + f
        return self._matcher.uipath(full)

    def matchfn(self, f):
        # Some information is lost in the superclass's constructor, so the
        # matching function for the subdirectory cannot be rebuilt
        # accurately from the inputs.  matchfn() and visitdir() are
        # overridden instead, calling the original matcher with the
        # subdirectory path prepended.
        full = self._path + "/" + f
        return self._matcher.matchfn(full)

    def visitdir(self, dir):
        # '.' denotes the subdirectory itself
        target = self._path if dir == '.' else self._path + "/" + dir
        return self._matcher.visitdir(target)

    def always(self):
        return self._always

    def prefix(self):
        return self._matcher.prefix() and not self._always

    @encoding.strmethod
    def __repr__(self):
        details = (self._path, self._matcher)
        return '<subdirmatcher path=%r, matcher=%r>' % details

655

656

class unionmatcher(basematcher):
    """Matcher accepting whatever at least one of several matchers accepts.

    root, cwd, explicitdir and traversedir are taken from the first
    matcher in the list.
    """

    def __init__(self, matchers):
        first = matchers[0]
        super(unionmatcher, self).__init__(first._root, first._cwd)
        self.explicitdir = first.explicitdir
        self.traversedir = first.traversedir
        self._matchers = matchers

    def matchfn(self, f):
        '''True as soon as one sub-matcher matches ``f``, else False.'''
        return any(sub(f) for sub in self._matchers)

    def visitdir(self, dir):
        '''Combine the visitdir() answers of all sub-matchers.

        Returns 'all' as soon as one sub-matcher answers 'all'; otherwise
        the answers are OR-ed together.
        '''
        verdict = False
        for sub in self._matchers:
            answer = sub.visitdir(dir)
            if answer == 'all':
                return answer
            verdict = verdict | answer
        return verdict

    @encoding.strmethod
    def __repr__(self):
        template = '<unionmatcher matchers=%r>'
        return template % self._matchers

688

689

def patkind(pattern, default=None):
    '''Return the kind of a 'kind:pat' pattern when the kind is known.

    Otherwise ``default`` is returned.'''
    kind, _pat = _patsplit(pattern, default)
    return kind

692

693

def _patsplit(pattern, default):

693

def _patsplit(pattern, default):

694

"""Split a string into the optional pattern kind prefix and the actual

694

"""Split a string into the optional pattern kind prefix and the actual

695

pattern."""

695

pattern."""

696

if ':' in pattern:

696

if ':' in pattern:

697

kind, pat = pattern.split(':', 1)

697

kind, pat = pattern.split(':', 1)

698

if kind in allpatternkinds:

698

if kind in allpatternkinds:

699

return kind, pat

699

return kind, pat

700

return default, pattern

700

return default, pattern

701

702

def _globre(pat):
    r'''Translate an extended glob into the text of a regular expression.

    >>> from . import pycompat
    >>> def bprint(s):
    ...     print(pycompat.sysstr(s))
    >>> bprint(_globre(br'?'))
    .
    >>> bprint(_globre(br'*'))
    [^/]*
    >>> bprint(_globre(br'**'))
    .*
    >>> bprint(_globre(br'**/a'))
    (?:.*/)?a
    >>> bprint(_globre(br'a/**/b'))
    a\/(?:.*/)?b
    >>> bprint(_globre(br'[a*?!^][^b][!c]'))
    [a*?!^][\^b][^c]
    >>> bprint(_globre(br'{a,b}'))
    (?:a|b)
    >>> bprint(_globre(br'.\*\?'))
    \.\*\?
    '''
    pos, length = 0, len(pat)
    pieces = []
    depth = 0  # number of currently open '{' groups
    quote = util.re.escape

    def lookahead():
        # next unread character, or False once the pattern is exhausted
        return pos < length and pat[pos:pos + 1]

    while pos < length:
        ch = pat[pos:pos + 1]
        pos += 1
        if ch not in '*?[{},\\':
            pieces.append(quote(ch))
        elif ch == '*':
            if lookahead() != '*':
                # a single star never crosses a directory separator
                pieces.append('[^/]*')
            else:
                pos += 1
                if lookahead() == '/':
                    # '**/' also matches zero directories
                    pos += 1
                    pieces.append('(?:.*/)?')
                else:
                    pieces.append('.*')
        elif ch == '?':
            pieces.append('.')
        elif ch == '[':
            # look for the closing bracket; a ']' or '!' right after the
            # opening one is part of the class
            close = pos
            if close < length and pat[close:close + 1] in '!]':
                close += 1
            while close < length and pat[close:close + 1] != ']':
                close += 1
            if close >= length:
                # unterminated class: the bracket is literal
                pieces.append('\\[')
            else:
                inner = pat[pos:close].replace('\\', '\\\\')
                pos = close + 1
                lead = inner[0:1]
                if lead == '!':
                    # glob negation becomes regexp negation
                    inner = '^' + inner[1:]
                elif lead == '^':
                    # a leading caret is literal in a glob
                    inner = '\\' + inner
                pieces.append('[%s]' % inner)
        elif ch == '{':
            depth += 1
            pieces.append('(?:')
        elif ch == '}' and depth:
            pieces.append(')')
            depth -= 1
        elif ch == ',' and depth:
            pieces.append('|')
        elif ch == '\\':
            following = lookahead()
            if following:
                pos += 1
                pieces.append(quote(following))
            else:
                # trailing backslash stands for itself
                pieces.append(quote(ch))
        else:
            # '}' or ',' outside of any group
            pieces.append(quote(ch))
    return ''.join(pieces)

782

783

def _regex(kind, pat, globsuffix):

783

def _regex(kind, pat, globsuffix):

784

'''Convert a (normalized) pattern of any kind into a regular expression.

784

'''Convert a (normalized) pattern of any kind into a regular expression.

785

globsuffix is appended to the regexp of globs.'''

785

globsuffix is appended to the regexp of globs.'''

786

if not pat:

786

if not pat:

787

return ''

787

return ''

788

if kind == 're':

788

if kind == 're':

789

return pat

789

return pat

790

if kind in ('path', 'relpath'):

790

if kind in ('path', 'relpath'):

791

if pat == '.':

791

if pat == '.':

792

return ''

792

return ''

793

return util.re.escape(pat) + '(?:/|$)'

793

return util.re.escape(pat) + '(?:/|$)'

794

if kind == 'rootfilesin':

794

if kind == 'rootfilesin':

795

if pat == '.':

795

if pat == '.':

796

escaped = ''

796

escaped = ''

797

else:

797

else:

798

# Pattern is a directory name.

798

# Pattern is a directory name.

799

escaped = util.re.escape(pat) + '/'

799

escaped = util.re.escape(pat) + '/'

800

# Anything after the pattern must be a non-directory.

800

# Anything after the pattern must be a non-directory.

801

return escaped + '[^/]+$'

801

return escaped + '[^/]+$'

802

if kind == 'relglob':

802

if kind == 'relglob':

803

return '(?:|.*/)' + _globre(pat) + globsuffix

803

return '(?:|.*/)' + _globre(pat) + globsuffix

804

if kind == 'relre':

804

if kind == 'relre':

805

if pat.startswith('^'):

805

if pat.startswith('^'):

806

return pat

806

return pat

807

return '.*' + pat

807

return '.*' + pat

808

return _globre(pat) + globsuffix

808

return _globre(pat) + globsuffix

809

810

def _buildmatch(ctx, kindpats, globsuffix, listsubrepos, root):
    '''Build a regexp string and a matching function out of kindpats.

    globsuffix is appended to the regexp of globs.

    Up to three partial matchers are collected (subincludes, expanded
    file sets, regexp); a path is accepted when any of them accepts it.
    '''
    partial = []

    subincludes, kindpats = _expandsubinclude(kindpats, root)
    if subincludes:
        built = {}  # prefix -> matcher, created on first use

        def matchsubinclude(f):
            for prefix, matcherargs in subincludes:
                if not f.startswith(prefix):
                    continue
                sub = built.get(prefix)
                if sub is None:
                    sub = match(*matcherargs)
                    built[prefix] = sub
                if sub(f[len(prefix):]):
                    return True
            return False
        partial.append(matchsubinclude)

    fset, kindpats = _expandsets(kindpats, ctx, listsubrepos)
    if fset:
        partial.append(fset.__contains__)

    regex = ''
    if kindpats:
        regex, rematch = _buildregexmatch(kindpats, globsuffix)
        partial.append(rematch)

    if len(partial) != 1:
        return regex, lambda f: any(mf(f) for mf in partial)
    # a single matcher needs no wrapper
    return regex, partial[0]

844

845

def _buildregexmatch(kindpats, globsuffix):
    """Compile a list of (kind, pat, source) entries into one matcher.

    Returns the regexp string and a matcher function.  Raises error.Abort
    when one of the patterns is not a valid regular expression."""
    try:
        alternatives = [_regex(k, p, globsuffix) for (k, p, s) in kindpats]
        regex = '(?:%s)' % '|'.join(alternatives)
        if len(regex) > 20000:
            raise OverflowError
        return regex, _rematcher(regex)
    except OverflowError:
        # We're using a Python with a tiny regex engine and we
        # made it explode, so we'll divide the pattern list in two
        # until it works
        count = len(kindpats)
        if count < 2:
            raise
        middle = count // 2
        a = _buildregexmatch(kindpats[:middle], globsuffix)[1]
        b = _buildregexmatch(kindpats[middle:], globsuffix)[1]
        return regex, lambda s: a(s) or b(s)
    except re.error:
        # compile the patterns one by one to report the offending one
        for k, p, s in kindpats:
            try:
                _rematcher('(?:%s)' % _regex(k, p, globsuffix))
            except re.error:
                if not s:
                    raise error.Abort(_("invalid pattern (%s): %s") % (k, p))
                raise error.Abort(_("%s: invalid pattern (%s): %s") %
                                  (s, k, p))
        raise error.Abort(_("invalid pattern"))

875

876

def _patternrootsanddirs(kindpats):

876

def _patternrootsanddirs(kindpats):

877

'''Returns roots and directories corresponding to each pattern.

877

'''Returns roots and directories corresponding to each pattern.

878

879

This calculates the roots and directories exactly matching the patterns and

879

This calculates the roots and directories exactly matching the patterns and

880

returns a tuple of (roots, dirs) for each. It does not return other

880

returns a tuple of (roots, dirs) for each. It does not return other

881

directories which may also need to be considered, like the parent

881

directories which may also need to be considered, like the parent

882

directories.

882

directories.

883

'''

883

'''

884

r = []

884

r = []

885

d = []

885

d = []

886

for kind, pat, source in kindpats:

886

for kind, pat, source in kindpats:

887

if kind == 'glob': # find the non-glob prefix

887

if kind == 'glob': # find the non-glob prefix

888

root = []

888

root = []

889

for p in pat.split('/'):

889

for p in pat.split('/'):

890

if '[' in p or '{' in p or '*' in p or '?' in p:

890

if '[' in p or '{' in p or '*' in p or '?' in p:

891

break

891

break

892

root.append(p)

892

root.append(p)

893

r.append('/'.join(root) or '.')

893

r.append('/'.join(root) or '.')

894

elif kind in ('relpath', 'path'):

894

elif kind in ('relpath', 'path'):

895

r.append(pat or '.')

895

r.append(pat or '.')

896

elif kind in ('rootfilesin',):

896

elif kind in ('rootfilesin',):

897

d.append(pat or '.')

897

d.append(pat or '.')

898

else: # relglob, re, relre

898

else: # relglob, re, relre

899

r.append('.')

899

r.append('.')

900

return r, d

900

return r, d

901

902

def _roots(kindpats):
    '''Return only the roots computed by _patternrootsanddirs().'''
    return _patternrootsanddirs(kindpats)[0]

906

907

def _rootsanddirs(kindpats):
    '''Compute roots and exact directories for a list of patterns.

    Roots are directories to match recursively, exact directories are to
    be matched non-recursively.  The returned (roots, dirs) tuple also
    includes directories that need to be implicitly considered as either,
    such as parent directories.

    >>> _rootsanddirs(
    ...     [(b'glob', b'g/h/*', b''), (b'glob', b'g/h', b''),
    ...      (b'glob', b'g*', b'')])
    (['g/h', 'g/h', '.'], ['g', '.'])
    >>> _rootsanddirs(
    ...     [(b'rootfilesin', b'g/h', b''), (b'rootfilesin', b'', b'')])
    ([], ['g/h', '.', 'g', '.'])
    >>> _rootsanddirs(
    ...     [(b'relpath', b'r', b''), (b'path', b'p/p', b''),
    ...      (b'path', b'', b'')])
    (['r', 'p/p', '.'], ['p', '.'])
    >>> _rootsanddirs(
    ...     [(b'relglob', b'rg*', b''), (b're', b're/', b''),
    ...      (b'relre', b'rr', b'')])
    (['.', '.', '.'], ['.'])
    '''
    roots, exact = _patternrootsanddirs(kindpats)

    # The parents are added as non-recursive/exact directories, since they
    # must be scanned to get to either the roots or the other exact
    # directories.
    implied = list(util.dirs(exact))
    implied.extend(util.dirs(roots))
    # util.dirs() does not include the root directory, so add it manually
    implied.append('.')
    exact.extend(implied)

    return roots, exact

941

942

def _explicitfiles(kindpats):
    '''Return the names from the patterns that may be explicit files.

    >>> _explicitfiles([(b'path', b'foo/bar', b'')])
    ['foo/bar']
    >>> _explicitfiles([(b'rootfilesin', b'foo/bar', b'')])
    []
    '''
    # 'rootfilesin' can only name directories, so those entries are
    # dropped; every other kind may specify a filename.
    candidates = []
    for entry in kindpats:
        if entry[0] != 'rootfilesin':
            candidates.append(entry)
    return _roots(candidates)

954

955

def _prefix(kindpats):

955

def _prefix(kindpats):

956

'''Whether all the patterns match a prefix (i.e. recursively)'''

956

'''Whether all the patterns match a prefix (i.e. recursively)'''

957

for kind, pat, source in kindpats:

957

for kind, pat, source in kindpats:

958

if kind not in ('path', 'relpath'):

958

if kind not in ('path', 'relpath'):

959

return False

959

return False

960

return True

960

return True

961

962

_commentre = None

962

_commentre = None

963

964

def readpatternfile(filepath, warn, sourceinfo=False):
    '''parse a pattern file, returning a list of
    patterns. These patterns should be given to compile()
    to be validated and converted into a match function.

    trailing white space is dropped.
    the escape character is backslash.
    comments start with #.
    empty lines are skipped.

    lines can be of the following formats:

    syntax: regexp # defaults following lines to non-rooted regexps
    syntax: glob   # defaults following lines to non-rooted globs
    re:pattern     # non-rooted regular expression
    glob:pattern   # non-rooted glob
    pattern        # pattern of the current default type

    if sourceinfo is set, returns a list of tuples:
    (pattern, lineno, originalline). This is useful to debug ignore patterns.

    warn, when truthy, is called with a message for each unknown
    'syntax:' name; such lines are otherwise ignored.
    '''
    global _commentre

    syntaxes = {'re': 'relre:', 'regexp': 'relre:', 'glob': 'relglob:',
                'include': 'include', 'subinclude': 'subinclude'}
    syntax = 'relre:'
    patterns = []

    # 'with' guarantees the file is closed even if parsing or warn() raises.
    with open(filepath, 'rb') as fp:
        for lineno, line in enumerate(util.iterfile(fp), start=1):
            if "#" in line:
                if not _commentre:
                    _commentre = util.re.compile(br'((?:^|[^\\])(?:\\\\)*)#.*')
                # remove comments prefixed by an even number of escapes
                m = _commentre.search(line)
                if m:
                    line = line[:m.end(1)]
                # fixup properly escaped comments that survived the above
                line = line.replace("\\#", "#")
            line = line.rstrip()
            if not line:
                continue

            if line.startswith('syntax:'):
                s = line[7:].strip()
                try:
                    syntax = syntaxes[s]
                except KeyError:
                    if warn:
                        warn(_("%s: ignoring invalid syntax '%s'\n") %
                             (filepath, s))
                # a 'syntax:' line only switches the default; it is never a
                # pattern itself
                continue

            # an explicit per-line prefix overrides the current default syntax
            linesyntax = syntax
            for s, rels in syntaxes.iteritems():
                if line.startswith(rels):
                    linesyntax = rels
                    line = line[len(rels):]
                    break
                elif line.startswith(s+':'):
                    linesyntax = rels
                    line = line[len(s) + 1:]
                    break
            if sourceinfo:
                patterns.append((linesyntax + line, lineno, line))
            else:
                patterns.append(linesyntax + line)
    return patterns

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # match.py - filename matching
             #
             #  Copyright 2008, 2009 Matt Mackall <mpm@selenic.com> and others
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import, print_function
             import copy
             import os
             import re
             from .i18n import _
             from . import (
                 encoding,
                 error,
                 pathutil,
                 pycompat,
                 util,
             )
             from .utils import (
                 stringutil,
             )
             # Names of the pattern kinds (the 'kind' part of a 'kind:pattern' string).
             allpatternkinds = ('re', 'glob', 'path', 'relglob', 'relpath', 'relre',
                                'listfile', 'listfile0', 'set', 'include', 'subinclude',
                                'rootfilesin')
             # Kinds whose pattern _donormalize() canonicalises against cwd.
             cwdrelativepatternkinds = ('relpath', 'glob')
             # Short local alias so classes below can write @propertycache.
             propertycache = util.propertycache
             def _rematcher(regex):
                 '''Compile ``regex`` through util.re and return a matcher function.

                 The compiled object's ``test_match`` attribute is preferred when it
                 exists; otherwise the ordinary ``match`` method is returned.
                 '''
                 compiled = util.re.compile(regex)
                 try:
                     # slightly faster, provided by facebook's re2 bindings
                     matcher = compiled.test_match
                 except AttributeError:
                     matcher = compiled.match
                 return matcher
             def _expandsets(kindpats, ctx, listsubrepos):
                 '''Returns the kindpats list with the 'set' patterns expanded.'''
                 fset = set()
                 other = []
                 for kind, pat, source in kindpats:
                     if kind == 'set':
                         if not ctx:
                             raise error.ProgrammingError("fileset expression with no "
                                                          "context")
                         s = ctx.getfileset(pat)
                         fset.update(s)
                         if listsubrepos:
                             for subpath in ctx.substate:
                                 s = ctx.sub(subpath).getfileset(pat)
                                 fset.update(subpath + '/' + f for f in s)
                         continue
                     other.append((kind, pat, source))
                 return fset, other
             def _expandsubinclude(kindpats, root):
                 '''Returns the list of subinclude matcher args and the kindpats without the
                 subincludes in it.'''
                 relmatchers = []
                 other = []
                 for kind, pat, source in kindpats:
                     if kind == 'subinclude':
                         sourceroot = pathutil.dirname(util.normpath(source))
                         pat = util.pconvert(pat)
                         path = pathutil.join(sourceroot, pat)
                         newroot = pathutil.dirname(path)
                         matcherargs = (newroot, '', [], ['include:%s' % path])
                         prefix = pathutil.canonpath(root, root, newroot)
                         if prefix:
                             prefix += '/'
                         relmatchers.append((prefix, matcherargs))
                     else:
                         other.append((kind, pat, source))
                 return relmatchers, other
             def _kindpatsalwaysmatch(kindpats):
                 """"Checks whether the kindspats match everything, as e.g.
                 'relpath:.' does.
                 """
                 for kind, pat, source in kindpats:
                     if pat != '' or kind not in ['relpath', 'glob']:
                         return False
                 return True
             def match(root, cwd, patterns=None, include=None, exclude=None, default='glob',
                       exact=False, auditor=None, ctx=None, listsubrepos=False, warn=None,
                       badfn=None, icasefs=False):
                 """build an object to match a set of file patterns

                 arguments:
                 root - the canonical root of the tree you're matching against
                 cwd - the current working directory, if relevant
                 patterns - patterns to find
                 include - patterns to include (unless they are excluded)
                 exclude - patterns to exclude (even if they are included)
                 default - if a pattern in patterns has no explicit type, assume this one
                 exact - patterns are actually filenames (include/exclude still apply)
                 warn - optional function used for printing warnings
                 badfn - optional bad() callback for this matcher instead of the default
                 icasefs - make a matcher for wdir on case insensitive filesystems, which
                     normalizes the given patterns to the case in the filesystem

                 a pattern is one of:
                 'glob:<glob>' - a glob relative to cwd
                 're:<regexp>' - a regular expression
                 'path:<path>' - a path relative to repository root, which is matched
                                 recursively
                 'rootfilesin:<path>' - a path relative to repository root, which is
                                 matched non-recursively (will not match subdirectories)
                 'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
                 'relpath:<path>' - a path relative to cwd
                 'relre:<regexp>' - a regexp that needn't match the start of a name
                 'set:<fileset>' - a fileset expression
                 'include:<path>' - a file of patterns to read and include
                 'subinclude:<path>' - a file of patterns to match against files under
                                       the same directory
                 '<something>' - a pattern of the specified default type
                 """
                 if not icasefs:
                     normalize = _donormalize
                 else:
                     if exact:
                         raise error.ProgrammingError("a case-insensitive exact matcher "
                                                      "doesn't make sense")
                     dirstate = ctx.repo().dirstate
                     dsnormalize = dirstate.normalize

                     def normalize(patterns, default, root, cwd, auditor, warn):
                         folded = []
                         for kind, pat, source in _donormalize(patterns, default, root,
                                                               cwd, auditor, warn):
                             if kind not in ('re', 'relre'):  # regex can't be normalized
                                 original = pat
                                 pat = dsnormalize(pat)
                                 # Preserve the original to handle a case only rename.
                                 if original != pat and original in dirstate:
                                     folded.append((kind, original, source))
                             folded.append((kind, pat, source))
                         return folded

                 # Primary matcher: exact file list, explicit patterns, or everything.
                 if exact:
                     m = exactmatcher(root, cwd, patterns, badfn)
                 elif not patterns:
                     # It's a little strange that no patterns means to match everything.
                     # Consider changing this to match nothing (probably using nevermatcher).
                     m = alwaysmatcher(root, cwd, badfn)
                 else:
                     kindpats = normalize(patterns, default, root, cwd, auditor, warn)
                     if _kindpatsalwaysmatch(kindpats):
                         m = alwaysmatcher(root, cwd, badfn, relativeuipath=True)
                     else:
                         m = patternmatcher(root, cwd, kindpats, ctx=ctx,
                                            listsubrepos=listsubrepos, badfn=badfn)

                 # -I style patterns narrow the result ...
                 if include:
                     inckindpats = normalize(include, 'glob', root, cwd, auditor, warn)
                     incmatcher = includematcher(root, cwd, inckindpats, ctx=ctx,
                                                 listsubrepos=listsubrepos, badfn=None)
                     m = intersectmatchers(m, incmatcher)
                 # ... and -X style patterns are subtracted from it.
                 if exclude:
                     exckindpats = normalize(exclude, 'glob', root, cwd, auditor, warn)
                     excmatcher = includematcher(root, cwd, exckindpats, ctx=ctx,
                                                 listsubrepos=listsubrepos, badfn=None)
                     m = differencematcher(m, excmatcher)
                 return m
             def exact(root, cwd, files, badfn=None):
                 '''Return an exactmatcher for ``files`` rooted at ``root``.'''
                 matcher = exactmatcher(root, cwd, files, badfn=badfn)
                 return matcher
             def always(root, cwd):
                 '''Return an alwaysmatcher (matches everything) for ``root``/``cwd``.'''
                 matcher = alwaysmatcher(root, cwd)
                 return matcher
             def never(root, cwd):
                 '''Return a nevermatcher (matches nothing) for ``root``/``cwd``.'''
                 matcher = nevermatcher(root, cwd)
                 return matcher
             def badmatch(match, badfn):
                 """Return a shallow copy of ``match`` whose bad() callback is ``badfn``.

                 The matcher passed in is left untouched.
                 """
                 clone = copy.copy(match)
                 clone.bad = badfn
                 return clone
             def _donormalize(patterns, default, root, cwd, auditor, warn):
                 '''Convert 'kind:pat' from the patterns list to tuples with kind and
                 normalized and rooted patterns and with listfiles expanded.

                 Returns a list of (kind, pat, source) tuples.  ``source`` is '' for
                 patterns given directly, the list file's path for patterns read from a
                 'listfile'/'listfile0', and the originating file for patterns pulled in
                 through 'include'.

                 Raises error.Abort when a list file cannot be read, or when normalizing
                 an included file aborts (the message is prefixed with the include
                 path).  An included file that raises IOError is skipped, with a
                 warning if ``warn`` is set.
                 '''
                 kindpats = []
                 for kind, pat in [_patsplit(p, default) for p in patterns]:
                     if kind in cwdrelativepatternkinds:
                         # cwd-relative kinds are rewritten relative to the repo root
                         pat = pathutil.canonpath(root, cwd, pat, auditor)
                     elif kind in ('relglob', 'path', 'rootfilesin'):
                         pat = util.normpath(pat)
                     elif kind in ('listfile', 'listfile0'):
                         try:
                             files = util.readfile(pat)
                             # listfile0 entries are NUL-separated, listfile entries
                             # are one per line
                             if kind == 'listfile0':
                                 files = files.split('\0')
                             else:
                                 files = files.splitlines()
                             files = [f for f in files if f]
                         except EnvironmentError:
                             raise error.Abort(_("unable to read file list (%s)") % pat)
                         # each listed entry is itself a pattern; normalize recursively
                         # and record the list file as its source
                         for k, p, source in _donormalize(files, default, root, cwd,
                                                          auditor, warn):
                             kindpats.append((k, p, pat))
                         continue
                     elif kind == 'include':
                         try:
                             fullpath = os.path.join(root, util.localpath(pat))
                             includepats = readpatternfile(fullpath, warn)
                             # keep the innermost source when includes are nested
                             for k, p, source in _donormalize(includepats, default,
                                                              root, cwd, auditor, warn):
                                 kindpats.append((k, p, source or pat))
                         except error.Abort as inst:
                             # re-raise with the include path prepended for context
                             raise error.Abort('%s: %s' % (pat, inst[0]))
                         except IOError as inst:
                             if warn:
                                 warn(_("skipping unreadable pattern file '%s': %s\n") %
                                      (pat, stringutil.forcebytestr(inst.strerror)))
                         continue
                     # else: re or relre - which cannot be normalized
                     kindpats.append((kind, pat, ''))
                 return kindpats
             class basematcher(object):
                 '''Common base for matchers: stores root/cwd and supplies defaults.

                 As defined here it matches nothing (matchfn() returns False), lists no
                 explicit files and asks for every directory to be visited; subclasses
                 override what they need.
                 '''

                 def __init__(self, root, cwd, badfn=None, relativeuipath=True):
                     self._root, self._cwd = root, cwd
                     self._relativeuipath = relativeuipath
                     # Only shadow the class-level bad() when a callback was supplied.
                     if badfn is not None:
                         self.bad = badfn

                 def __call__(self, fn):
                     '''Calling the matcher is shorthand for matchfn().'''
                     return self.matchfn(fn)

                 def __iter__(self):
                     '''Iterate over the explicitly listed files.'''
                     for name in self._files:
                         yield name

                 # Callbacks related to how the matcher is used by dirstate.walk.
                 # Subscribers to these events must monkeypatch the matcher object.
                 def bad(self, f, msg):
                     '''Callback from dirstate.walk for each explicit file that can't be
                     found/accessed, with an error message.'''

                 # If an explicitdir is set, it will be called when an explicitly listed
                 # directory is visited.
                 explicitdir = None

                 # If a traversedir is set, it will be called when a directory discovered
                 # by recursive traversal is visited.
                 traversedir = None

                 def abs(self, f):
                     '''Convert a repo path back to path that is relative to the root of the
                     matcher.'''
                     return f

                 def rel(self, f):
                     '''Convert repo path back to path that is relative to cwd of matcher.'''
                     return util.pathto(self._root, self._cwd, f)

                 def uipath(self, f):
                     '''Convert repo path to a display path.  If patterns or -I/-X were used
                     to create this matcher, the display path will be relative to cwd.
                     Otherwise it is relative to the root of the repo.'''
                     if self._relativeuipath:
                         relative = self.rel(f)
                         # an empty relative path falls back to the root-relative form
                         if relative:
                             return relative
                     return self.abs(f)

                 @propertycache
                 def _files(self):
                     return []

                 def files(self):
                     '''Explicitly listed files or patterns or roots:
                     if no patterns or .always(): empty list,
                     if exact: list exact files,
                     if not .anypats(): list all files and dirs,
                     else: optimal roots'''
                     return self._files

                 @propertycache
                 def _fileset(self):
                     return set(self._files)

                 def exact(self, f):
                     '''Returns True if f is in .files().'''
                     return f in self._fileset

                 def matchfn(self, f):
                     '''Default match function: nothing matches.'''
                     return False

                 def visitdir(self, dir):
                     '''Decides whether a directory should be visited based on whether it
                     has potential matches in it or one of its subdirectories. This is
                     based on the match's primary, included, and excluded patterns.

                     Returns the string 'all' if the given directory and all subdirectories
                     should be visited. Otherwise returns True or False indicating whether
                     the given directory should be visited.
                     '''
                     return True

                 def always(self):
                     '''Matcher will match everything and .files() will be empty --
                     optimization might be possible.'''
                     return False

                 def isexact(self):
                     '''Matcher will match exactly the list of files in .files() --
                     optimization might be possible.'''
                     return False

                 def prefix(self):
                     '''Matcher will match the paths in .files() recursively --
                     optimization might be possible.'''
                     return False

                 def anypats(self):
                     '''None of .always(), .isexact(), and .prefix() is true --
                     optimizations will be difficult.'''
                     return not (self.always() or self.isexact() or self.prefix())
             class alwaysmatcher(basematcher):
                 '''Matches everything.'''

                 def __init__(self, root, cwd, badfn=None, relativeuipath=False):
                     # Note the default for relativeuipath is False here, unlike the
                     # base class.
                     super(alwaysmatcher, self).__init__(root, cwd, badfn,
                                                         relativeuipath)

                 def __repr__(self):
                     return r'<alwaysmatcher>'

                 def matchfn(self, f):
                     '''Every file matches.'''
                     return True

                 def always(self):
                     return True

                 def visitdir(self, dir):
                     '''Every directory and all of its subdirectories are visited.'''
                     return 'all'
             class nevermatcher(basematcher):
                 '''Matches nothing.'''

                 def __init__(self, root, cwd, badfn=None):
                     super(nevermatcher, self).__init__(root, cwd, badfn=badfn)

                 def __repr__(self):
                     return r'<nevermatcher>'

                 # It's a little weird to say that the nevermatcher is an exact matcher
                 # or a prefix matcher, but it seems to make sense to let callers take
                 # fast paths based on either. There will be no exact matches, nor any
                 # prefixes (files() returns []), so fast paths iterating over them should
                 # be efficient (and correct).
                 def isexact(self):
                     return True

                 def prefix(self):
                     return True

                 def visitdir(self, dir):
                     '''No directory ever needs to be visited.'''
                     return False
             class patternmatcher(basematcher):
                 '''Matcher built from a list of (kind, pat, source) patterns.

                 The match function and the pattern text used by __repr__ come from
                 _buildmatch(); files() holds the explicit file names derived from the
                 patterns by _explicitfiles().
                 '''

                 def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                              badfn=None):
                     super(patternmatcher, self).__init__(root, cwd, badfn)
                     self._files = _explicitfiles(kindpats)
                     self._prefix = _prefix(kindpats)
                     self._pats, self.matchfn = _buildmatch(ctx, kindpats, '$', listsubrepos,
                                                            root)

                 @propertycache
                 def _dirs(self):
                     # parent directories of the listed files, plus the root ('.')
                     return set(util.dirs(self._fileset)) | {'.'}

                 def visitdir(self, dir):
                     '''Return 'all', True or False as described in basematcher.visitdir.'''
                     # A prefix matcher naming this directory matches everything below.
                     if self._prefix and dir in self._fileset:
                         return 'all'
                     return ('.' in self._fileset or
                             dir in self._fileset or
                             dir in self._dirs or
                             any(parentdir in self._fileset
                                 for parentdir in util.finddirs(dir)))

                 def prefix(self):
                     return self._prefix

                 @encoding.strmethod
                 def __repr__(self):
                     # bytestr() keeps the %r output consistent with includematcher
                     return ('<patternmatcher patterns=%r>' % pycompat.bytestr(self._pats))
             class includematcher(basematcher):
                 '''Matcher for include/exclude style patterns.

                 Patterns are compiled by _buildmatch() with a '(?:/|$)' suffix, and the
                 directories to walk are derived from _rootsanddirs().
                 '''

                 def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                              badfn=None):
                     super(includematcher, self).__init__(root, cwd, badfn)
                     self._pats, self.matchfn = _buildmatch(ctx, kindpats, '(?:/|$)',
                                                            listsubrepos, root)
                     self._prefix = _prefix(kindpats)
                     recursive, nonrecursive = _rootsanddirs(kindpats)
                     # roots are directories which are recursively included.
                     self._roots = set(recursive)
                     # dirs are directories which are non-recursively included.
                     self._dirs = set(nonrecursive)

                 def visitdir(self, dir):
                     '''Return 'all', True or False as described in basematcher.visitdir.'''
                     roots = self._roots
                     if self._prefix and dir in roots:
                         return 'all'
                     if '.' in roots or dir in roots or dir in self._dirs:
                         return True
                     return any(parentdir in roots
                                for parentdir in util.finddirs(dir))

                 @encoding.strmethod
                 def __repr__(self):
                     return ('<includematcher includes=%r>' % pycompat.bytestr(self._pats))
             class exactmatcher(basematcher):
                 '''Matches the input files exactly. They are interpreted as paths, not
                 patterns (so no kind-prefixes).
                 '''

                 def __init__(self, root, cwd, files, badfn=None):
                     super(exactmatcher, self).__init__(root, cwd, badfn)
                     # A list is stored as-is (not copied); other iterables are
                     # materialised into a new list.
                     self._files = files if isinstance(files, list) else list(files)

                 # A file matches iff it is one of the listed files.
                 matchfn = basematcher.exact

                 @propertycache
                 def _dirs(self):
                     # parent directories of the listed files, plus the root ('.')
                     return set(util.dirs(self._fileset)) | {'.'}

                 def visitdir(self, dir):
                     '''Visit only directories that contain one of the listed files.'''
                     return dir in self._dirs

                 def isexact(self):
                     return True

                 @encoding.strmethod
                 def __repr__(self):
                     return ('<exactmatcher files=%r>' % self._files)
             class differencematcher(basematcher):
                 '''Composes two matchers by matching if the first matches and the second
                 does not.

                 The second matcher's non-matching-attributes (root, cwd, bad, explicitdir,
                 traversedir) are ignored.
                 '''

                 def __init__(self, m1, m2):
                     super(differencematcher, self).__init__(m1._root, m1._cwd)
                     self._m1, self._m2 = m1, m2
                     # Callbacks are inherited from the first matcher only.
                     self.bad = m1.bad
                     self.explicitdir = m1.explicitdir
                     self.traversedir = m1.traversedir

                 def matchfn(self, f):
                     included = self._m1(f)
                     return included and not self._m2(f)

                 @propertycache
                 def _files(self):
                     if not self.isexact():
                         # If m1 is not an exact matcher, we can't easily figure out the
                         # set of files, because its files() are not always files. For
                         # example, if m1 is "path:dir" and m2 is "rootfilesin:.", we
                         # don't want to remove "dir" from the set even though it would
                         # match m2, because the "dir" in m1 may not be a file.
                         return self._m1.files()
                     return [f for f in self._m1.files() if self(f)]

                 def visitdir(self, dir):
                     '''Skip a directory m2 covers entirely; otherwise defer to m1.'''
                     fullyexcluded = self._m2.visitdir(dir) == 'all'
                     if fullyexcluded:
                         return False
                     return bool(self._m1.visitdir(dir))

                 def isexact(self):
                     return self._m1.isexact()

                 @encoding.strmethod
                 def __repr__(self):
                     return ('<differencematcher m1=%r, m2=%r>' % (self._m1, self._m2))
             def intersectmatchers(m1, m2):
                 '''Composes two matchers by matching if both of them match.

                 The second matcher's non-matching-attributes (root, cwd, bad, explicitdir,
                 traversedir) are ignored.

                 If either argument is None the other one is returned unchanged.  If one
                 of them always matches, a copy of the other is returned instead of a
                 real intersectionmatcher.
                 '''
                 if m1 is None or m2 is None:
                     return m1 or m2
                 if m1.always():
                     # m2 alone decides what matches, but it must behave like m1 for
                     # everything else.
                     combined = copy.copy(m2)
                     # TODO: Consider encapsulating these things in a class so there's only
                     # one thing to copy from m1.
                     combined.bad = m1.bad
                     combined.explicitdir = m1.explicitdir
                     combined.traversedir = m1.traversedir
                     combined.abs = m1.abs
                     combined.rel = m1.rel
                     combined._relativeuipath |= m1._relativeuipath
                     return combined
                 if m2.always():
                     combined = copy.copy(m1)
                     combined._relativeuipath |= m2._relativeuipath
                     return combined
                 return intersectionmatcher(m1, m2)
             class intersectionmatcher(basematcher):
                 '''Matches a file only when both wrapped matchers match it.

                 Root, cwd and the bad/explicitdir/traversedir callbacks are taken from
                 the first matcher.
                 '''

                 def __init__(self, m1, m2):
                     super(intersectionmatcher, self).__init__(m1._root, m1._cwd)
                     self._m1, self._m2 = m1, m2
                     self.bad = m1.bad
                     self.explicitdir = m1.explicitdir
                     self.traversedir = m1.traversedir

                 @propertycache
                 def _files(self):
                     if not self.isexact():
                         # If neither m1 nor m2 is an exact matcher, we can't easily
                         # intersect the set of files, because their files() are not
                         # always files. For example, if intersecting a matcher
                         # "-I glob:foo.txt" with matcher of "path:dir2", we don't want
                         # to remove "dir2" from the set.
                         return self._m1.files() + self._m2.files()
                     # Filter the exact side's file list through the other matcher.
                     if self._m1.isexact():
                         exactside, otherside = self._m1, self._m2
                     else:
                         exactside, otherside = self._m2, self._m1
                     return [f for f in exactside.files() if otherside(f)]

                 def matchfn(self, f):
                     return self._m1(f) and self._m2(f)

                 def visitdir(self, dir):
                     '''Return 'all', True or False as described in basematcher.visitdir.'''
                     first = self._m1.visitdir(dir)
                     if first == 'all':
                         return self._m2.visitdir(dir)
                     # bool() because visit1=True + visit2='all' should not be 'all'
                     return bool(first and self._m2.visitdir(dir))

                 def always(self):
                     return self._m1.always() and self._m2.always()

                 def isexact(self):
                     return self._m1.isexact() or self._m2.isexact()

                 @encoding.strmethod
                 def __repr__(self):
                     return ('<intersectionmatcher m1=%r, m2=%r>' % (self._m1, self._m2))
             class subdirmatcher(basematcher):
                 """Present a matcher as seen from inside one of its subdirectories.
                 Paths given to this matcher are relative to the subdirectory; the
                 subdirectory name is prepended before the wrapped matcher is asked,
                 and stripped from the wrapped matcher's files:
                 >>> from . import pycompat
                 >>> m1 = match(b'root', b'', [b'a.txt', b'sub/b.txt'])
                 >>> m2 = subdirmatcher(b'sub', m1)
                 >>> bool(m2(b'a.txt'))
                 False
                 >>> bool(m2(b'b.txt'))
                 True
                 >>> bool(m2.matchfn(b'a.txt'))
                 False
                 >>> bool(m2.matchfn(b'b.txt'))
                 True
                 >>> m2.files()
                 ['b.txt']
                 >>> m2.exact(b'b.txt')
                 True
                 >>> util.pconvert(m2.rel(b'b.txt'))
                 'sub/b.txt'
                 >>> def bad(f, msg):
                 ...     print(pycompat.sysstr(b"%s: %s" % (f, msg)))
                 >>> m1.bad = bad
                 >>> m2.bad(b'x.txt', b'No such file')
                 sub/x.txt: No such file
                 >>> m2.abs(b'c.txt')
                 'sub/c.txt'
                 """
                 def __init__(self, path, matcher):
                     super(subdirmatcher, self).__init__(matcher._root, matcher._cwd)
                     self._path = path
                     self._matcher = matcher
                     self._always = matcher.always()
                     # Keep the wrapped matcher's files that live below ``path`` and
                     # make them relative to it.
                     dirprefix = path + "/"
                     striplen = len(path) + 1
                     self._files = [name[striplen:] for name in matcher._files
                                    if name.startswith(dirprefix)]
                     # When the wrapped matcher is a prefix matcher, this matcher
                     # matches everything exactly when ``path`` itself is one of the
                     # wrapped matcher's files.
                     if matcher.prefix():
                         self._always = any(name == path for name in matcher._files)
                 def _parentpath(self, f):
                     # Name of f as the wrapped matcher knows it.
                     return self._path + "/" + f
                 def bad(self, f, msg):
                     self._matcher.bad(self._parentpath(f), msg)
                 def abs(self, f):
                     return self._matcher.abs(self._parentpath(f))
                 def rel(self, f):
                     return self._matcher.rel(self._parentpath(f))
                 def uipath(self, f):
                     return self._matcher.uipath(self._parentpath(f))
                 def matchfn(self, f):
                     # The superclass constructor does not keep enough information to
                     # rebuild a matching function for the subdirectory, so matchfn()
                     # and visitdir() delegate to the wrapped matcher with the
                     # subdirectory path prepended.
                     return self._matcher.matchfn(self._parentpath(f))
                 def visitdir(self, dir):
                     # '.' stands for the subdirectory itself.
                     parentdir = self._path if dir == '.' else self._path + "/" + dir
                     return self._matcher.visitdir(parentdir)
                 def always(self):
                     return self._always
                 def prefix(self):
                     parentprefix = self._matcher.prefix()
                     if not parentprefix:
                         return parentprefix
                     return not self._always
                 @encoding.strmethod
                 def __repr__(self):
                     details = (self._path, self._matcher)
                     return '<subdirmatcher path=%r, matcher=%r>' % details
             class unionmatcher(basematcher):
                 """A matcher accepting whatever any one of several matchers accepts.
                 root, cwd, explicitdir and traversedir are copied from the first
                 matcher in the list.
                 """
                 def __init__(self, matchers):
                     first = matchers[0]
                     super(unionmatcher, self).__init__(first._root, first._cwd)
                     self.explicitdir = first.explicitdir
                     self.traversedir = first.traversedir
                     self._matchers = matchers
                 def matchfn(self, f):
                     return any(m(f) for m in self._matchers)
                 def visitdir(self, dir):
                     # An 'all' answer from any member is returned immediately; the
                     # remaining answers are OR-ed together.
                     visit = False
                     for member in self._matchers:
                         answer = member.visitdir(dir)
                         if answer == 'all':
                             return answer
                         visit |= answer
                     return visit
                 @encoding.strmethod
                 def __repr__(self):
                     members = self._matchers
                     return '<unionmatcher matchers=%r>' % members
             def patkind(pattern, default=None):
                 '''Return the kind of a 'kind:pat' pattern when kind is a known one,
                 and default otherwise.'''
                 kind, _pat = _patsplit(pattern, default)
                 return kind
             def _patsplit(pattern, default):
                 """Split a string into the optional pattern kind prefix and the actual
                 pattern."""
                 if ':' in pattern:
                     kind, pat = pattern.split(':', 1)
                     if kind in allpatternkinds:
                         return kind, pat
                 return default, pattern
             def _globre(pat):
                 r'''Convert an extended glob string to a regexp string.
                 The glob is scanned one character at a time and translated as:
                   *      -> [^/]*
                   **     -> .*
                   **/    -> (?:.*/)?
                   ?      -> .
                   [...]  -> a regexp character class; a leading '!' becomes '^'
                             and a leading '^' is backslash-escaped
                   {a,b}  -> (?:a|b)
                   \x     -> x passed through the regexp escape function
                 Any other character is passed through the regexp escape function.
                 A '[' with no closing ']' is emitted as an escaped bracket, and a
                 '}' or ',' seen outside of a '{' group is escaped as a literal.
                 >>> from . import pycompat
                 >>> def bprint(s):
                 ...     print(pycompat.sysstr(s))
                 >>> bprint(_globre(br'?'))
                 .
                 >>> bprint(_globre(br'*'))
                 [^/]*
                 >>> bprint(_globre(br'**'))
                 .*
                 >>> bprint(_globre(br'**/a'))
                 (?:.*/)?a
                 >>> bprint(_globre(br'a/**/b'))
                 a\/(?:.*/)?b
                 >>> bprint(_globre(br'[a*?!^][^b][!c]'))
                 [a*?!^][\^b][^c]
                 >>> bprint(_globre(br'{a,b}'))
                 (?:a|b)
                 >>> bprint(_globre(br'.\*\?'))
                 \.\*\?
                 '''
                 # i is the read position in pat, n its length.
                 i, n = 0, len(pat)
                 # res accumulates the regexp built so far.
                 res = ''
                 # group counts the '{' groups currently open.
                 group = 0
                 escape = util.re.escape
                 def peek():
                     # Next unread character, or False once the end is reached.
                     return i < n and pat[i:i + 1]
                 while i < n:
                     # One-element slices are used instead of indexing.
                     # NOTE(review): presumably so that bytes patterns yield bytes
                     # rather than ints on Python 3 -- confirm.
                     c = pat[i:i + 1]
                     i += 1
                     if c not in '*?[{},\\':
                         # Not a glob metacharacter: emit it escaped.
                         res += escape(c)
                     elif c == '*':
                         if peek() == '*':
                             # '**': consume the second star.
                             i += 1
                             if peek() == '/':
                                 # '**/': consume the slash too; the whole directory
                                 # prefix is optional.
                                 i += 1
                                 res += '(?:.*/)?'
                             else:
                                 res += '.*'
                         else:
                             # A single '*' does not cross a '/'.
                             res += '[^/]*'
                     elif c == '?':
                         res += '.'
                     elif c == '[':
                         # Look for the closing ']' starting at j. A '!' or ']'
                         # directly after the '[' is skipped first, so it cannot
                         # terminate the class.
                         j = i
                         if j < n and pat[j:j + 1] in '!]':
                             j += 1
                         while j < n and pat[j:j + 1] != ']':
                             j += 1
                         if j >= n:
                             # No closing bracket: treat '[' as a literal character.
                             res += '\\['
                         else:
                             # Class body, with backslashes doubled for the regexp.
                             stuff = pat[i:j].replace('\\','\\\\')
                             # Resume scanning just past the closing ']'.
                             i = j + 1
                             if stuff[0:1] == '!':
                                 # Glob negation '!' becomes regexp negation '^'.
                                 stuff = '^' + stuff[1:]
                             elif stuff[0:1] == '^':
                                 # A leading '^' is literal in the glob: escape it.
                                 stuff = '\\' + stuff
                             res = '%s[%s]' % (res, stuff)
                     elif c == '{':
                         # Open an alternation group.
                         # NOTE(review): nothing below closes a group left open at
                         # the end of pat.
                         group += 1
                         res += '(?:'
                     elif c == '}' and group:
                         res += ')'
                         group -= 1
                     elif c == ',' and group:
                         res += '|'
                     elif c == '\\':
                         p = peek()
                         if p:
                             # Backslash escapes the next character: consume it and
                             # emit it as a literal.
                             i += 1
                             res += escape(p)
                         else:
                             # Trailing backslash: emit the backslash itself.
                             res += escape(c)
                     else:
                         # '}' or ',' outside of any group: plain literal.
                         res += escape(c)
                 return res
             def _regex(kind, pat, globsuffix):
                 '''Convert a (normalized) pattern of any kind into a regular expression.
                 globsuffix is appended to the regexp of globs.'''
                 if not pat:
                     return ''
                 if kind == 're':
                     return pat
                 if kind in ('path', 'relpath'):
                     if pat == '.':
                         return ''
                     return util.re.escape(pat) + '(?:/|$)'
                 if kind == 'rootfilesin':
                     if pat == '.':
                         escaped = ''
                     else:
                         # Pattern is a directory name.
                         escaped = util.re.escape(pat) + '/'
                     # Anything after the pattern must be a non-directory.
                     return escaped + '[^/]+$'
                 if kind == 'relglob':
                     return '(?:|.*/)' + _globre(pat) + globsuffix
                 if kind == 'relre':
                     if pat.startswith('^'):
                         return pat
                     return '.*' + pat
                 return _globre(pat) + globsuffix
             def _buildmatch(ctx, kindpats, globsuffix, listsubrepos, root):
                 '''Build a (regexp string, matcher function) pair for kindpats.
                 Subincludes, file sets and the remaining patterns each contribute one
                 match function; the result accepts a file if any of them does.
                 globsuffix is appended to the regexp of globs.'''
                 candidates = []
                 subincludes, kindpats = _expandsubinclude(kindpats, root)
                 if subincludes:
                     # Matchers for subincludes are created on first use, per prefix.
                     built = {}
                     def matchsubinclude(f):
                         for prefix, matcherargs in subincludes:
                             if not f.startswith(prefix):
                                 continue
                             submatch = built.get(prefix)
                             if submatch is None:
                                 submatch = built[prefix] = match(*matcherargs)
                             if submatch(f[len(prefix):]):
                                 return True
                         return False
                     candidates.append(matchsubinclude)
                 fset, kindpats = _expandsets(kindpats, ctx, listsubrepos)
                 if fset:
                     candidates.append(fset.__contains__)
                 regex = ''
                 if kindpats:
                     regex, rematch = _buildregexmatch(kindpats, globsuffix)
                     candidates.append(rematch)
                 if len(candidates) != 1:
                     return regex, lambda f: any(fn(f) for fn in candidates)
                 return regex, candidates[0]
             def _buildregexmatch(kindpats, globsuffix):
                 """Compile kindpats into one regexp and return (regexp string, matcher).
                 Raises error.Abort when a pattern does not compile."""
                 try:
                     alternatives = [_regex(kind, pat, globsuffix)
                                     for (kind, pat, source) in kindpats]
                     regex = '(?:%s)' % '|'.join(alternatives)
                     if len(regex) > 20000:
                         raise OverflowError
                     return regex, _rematcher(regex)
                 except OverflowError:
                     # The combined regexp is too large for the regexp engine: split
                     # the pattern list in two and match against either half,
                     # recursing until each piece is accepted.
                     total = len(kindpats)
                     if total < 2:
                         raise
                     middle = total // 2
                     matcha = _buildregexmatch(kindpats[:middle], globsuffix)[1]
                     matchb = _buildregexmatch(kindpats[middle:], globsuffix)[1]
                     return regex, lambda s: matcha(s) or matchb(s)
                 except re.error:
                     # Compile the patterns one by one to report the offending one.
                     for kind, pat, source in kindpats:
                         try:
                             _rematcher('(?:%s)' % _regex(kind, pat, globsuffix))
                         except re.error:
                             if not source:
                                 raise error.Abort(_("invalid pattern (%s): %s") %
                                                   (kind, pat))
                             raise error.Abort(_("%s: invalid pattern (%s): %s") %
                                               (source, kind, pat))
                     raise error.Abort(_("invalid pattern"))
             def _patternrootsanddirs(kindpats):
                 '''Returns roots and directories corresponding to each pattern.
                 This calculates the roots and directories exactly matching the patterns and
                 returns a tuple of (roots, dirs) for each. It does not return other
                 directories which may also need to be considered, like the parent
                 directories.
                 '''
                 r = []
                 d = []
                 for kind, pat, source in kindpats:
                     if kind == 'glob': # find the non-glob prefix
                         root = []
                         for p in pat.split('/'):
                             if '[' in p or '{' in p or '*' in p or '?' in p:
                                 break
                             root.append(p)
                         r.append('/'.join(root) or '.')
                     elif kind in ('relpath', 'path'):
                         r.append(pat or '.')
                     elif kind in ('rootfilesin',):
                         d.append(pat or '.')
                     else: # relglob, re, relre
                         r.append('.')
                 return r, d
             def _roots(kindpats):
                 '''Return only the roots computed by _patternrootsanddirs().'''
                 return _patternrootsanddirs(kindpats)[0]
             def _rootsanddirs(kindpats):
                 '''Return (roots, dirs) for the patterns, implied directories included.
                 roots are to be matched recursively, dirs non-recursively. On top of
                 what the patterns name directly, dirs receives the parents of every
                 root and directory, plus the top-level '.'.
                 >>> _rootsanddirs(
                 ...     [(b'glob', b'g/h/*', b''), (b'glob', b'g/h', b''),
                 ...      (b'glob', b'g*', b'')])
                 (['g/h', 'g/h', '.'], ['g', '.'])
                 >>> _rootsanddirs(
                 ...     [(b'rootfilesin', b'g/h', b''), (b'rootfilesin', b'', b'')])
                 ([], ['g/h', '.', 'g', '.'])
                 >>> _rootsanddirs(
                 ...     [(b'relpath', b'r', b''), (b'path', b'p/p', b''),
                 ...      (b'path', b'', b'')])
                 (['r', 'p/p', '.'], ['p', '.'])
                 >>> _rootsanddirs(
                 ...     [(b'relglob', b'rg*', b''), (b're', b're/', b''),
                 ...      (b'relre', b'rr', b'')])
                 (['.', '.', '.'], ['.'])
                 '''
                 roots, exact = _patternrootsanddirs(kindpats)
                 # Parents must be scanned to reach the roots and the exact
                 # directories, so they are added as non-recursive directories.
                 parents = list(util.dirs(exact))
                 parents.extend(util.dirs(roots))
                 exact.extend(parents)
                 # The top-level directory is not among the parents collected above.
                 exact.append('.')
                 return roots, exact
             def _explicitfiles(kindpats):
                 '''Return the names from the patterns that may be explicit files.
                 >>> _explicitfiles([(b'path', b'foo/bar', b'')])
                 ['foo/bar']
                 >>> _explicitfiles([(b'rootfilesin', b'foo/bar', b'')])
                 []
                 '''
                 # rootfilesin can only name directories, so it is left out.
                 candidates = []
                 for kindpat in kindpats:
                     if kindpat[0] != 'rootfilesin':
                         candidates.append(kindpat)
                 return _roots(candidates)
             def _prefix(kindpats):
                 '''Whether all the patterns match a prefix (i.e. recursively)'''
                 for kind, pat, source in kindpats:
                     if kind not in ('path', 'relpath'):
                         return False
                 return True
             # Compiled comment-stripping regexp, built the first time
             # readpatternfile() meets a line containing '#'.
             _commentre = None
             def readpatternfile(filepath, warn, sourceinfo=False):
                 '''parse a pattern file, returning a list of
                 patterns. These patterns should be given to compile()
                 to be validated and converted into a match function.
                 trailing white space is dropped.
                 the escape character is backslash.
                 comments start with #.
                 empty lines are skipped.
                 lines can be of the following formats:
                 syntax: regexp # defaults following lines to non-rooted regexps
                 syntax: glob   # defaults following lines to non-rooted globs
                 re:pattern     # non-rooted regular expression
                 glob:pattern   # non-rooted glob
                 pattern        # pattern of the current default type
                 a "syntax:" line naming an unknown syntax is ignored; warn, when
                 true, is called with a message describing it.
                 if sourceinfo is set, returns a list of tuples:
                 (pattern, lineno, line), where line is the text left after comment
                 removal, stripping of trailing white space and removal of any
                 syntax prefix. This is useful to debug ignore patterns.
                 '''
                 global _commentre
                 syntaxes = {'re': 'relre:', 'regexp': 'relre:', 'glob': 'relglob:',
                             'include': 'include', 'subinclude': 'subinclude'}
                 syntax = 'relre:'
                 patterns = []
                 # The with block closes the file even when parsing or the warn
                 # callback raises.
                 with open(filepath, 'rb') as fp:
                     for lineno, line in enumerate(util.iterfile(fp), start=1):
                         if "#" in line:
                             if not _commentre:
                                 _commentre = util.re.compile(br'((?:^|[^\\])(?:\\\\)*)#.*')
                             # remove comments prefixed by an even number of escapes
                             m = _commentre.search(line)
                             if m:
                                 line = line[:m.end(1)]
                             # fixup properly escaped comments that survived the above
                             line = line.replace("\\#", "#")
                         line = line.rstrip()
                         if not line:
                             continue
                         if line.startswith('syntax:'):
                             # Switch the default syntax for the lines that follow.
                             s = line[7:].strip()
                             try:
                                 syntax = syntaxes[s]
                             except KeyError:
                                 if warn:
                                     warn(_("%s: ignoring invalid syntax '%s'\n") %
                                          (filepath, s))
                             continue
                         # An explicit prefix on the line overrides the default syntax;
                         # the prefix is removed from the line and replaced by the
                         # mapped one.
                         linesyntax = syntax
                         for s, rels in syntaxes.iteritems():
                             if line.startswith(rels):
                                 linesyntax = rels
                                 line = line[len(rels):]
                                 break
                             elif line.startswith(s+':'):
                                 linesyntax = rels
                                 line = line[len(s) + 1:]
                                 break
                         if sourceinfo:
                             patterns.append((linesyntax + line, lineno, line))
                         else:
                             patterns.append(linesyntax + line)
                 return patterns