upstream/mercurial-mirror Commit - r36590:9adfa487

1

# match.py - filename matching

1

# match.py - filename matching

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from __future__ import absolute_import, print_function

import copy
import os
import re

from .i18n import _
from . import (
    encoding,
    error,
    pathutil,
    pycompat,
    util,
)

21

22

# Every pattern kind prefix ('kind:pattern') known to this module.
allpatternkinds = ('re', 'glob', 'path', 'relglob', 'relpath', 'relre',
                   'listfile', 'listfile0', 'set', 'include', 'subinclude',
                   'rootfilesin')
# Kinds whose patterns are canonicalized against cwd during normalization.
cwdrelativepatternkinds = ('relpath', 'glob')

26

27

# Local alias so the matcher classes can write '@propertycache'.
propertycache = util.propertycache

28

29

def _rematcher(regex):
    '''compile the regexp with the best available regexp engine and return a
    matcher function

    The pattern is compiled through util.re. The compiled object's
    test_match attribute is returned when it exists, otherwise its match
    attribute.'''
    m = util.re.compile(regex)
    try:
        # slightly faster, provided by facebook's re2 bindings
        return m.test_match
    except AttributeError:
        return m.match

38

39

def _expandsets(kindpats, ctx, listsubrepos):

40

def _expandsets(kindpats, ctx, listsubrepos):

40

'''Returns the kindpats list with the 'set' patterns expanded.'''

41

'''Returns the kindpats list with the 'set' patterns expanded.'''

41

fset = set()

42

fset = set()

42

other = []

43

other = []

43

44

for kind, pat, source in kindpats:

45

for kind, pat, source in kindpats:

45

if kind == 'set':

46

if kind == 'set':

46

if not ctx:

47

if not ctx:

47

raise error.ProgrammingError("fileset expression with no "

48

raise error.ProgrammingError("fileset expression with no "

48

"context")

49

"context")

49

s = ctx.getfileset(pat)

50

s = ctx.getfileset(pat)

50

fset.update(s)

51

fset.update(s)

51

52

if listsubrepos:

53

if listsubrepos:

53

for subpath in ctx.substate:

54

for subpath in ctx.substate:

54

s = ctx.sub(subpath).getfileset(pat)

55

s = ctx.sub(subpath).getfileset(pat)

55

fset.update(subpath + '/' + f for f in s)

56

fset.update(subpath + '/' + f for f in s)

56

57

continue

58

continue

58

other.append((kind, pat, source))

59

other.append((kind, pat, source))

59

return fset, other

60

return fset, other

60

61

def _expandsubinclude(kindpats, root):

62

def _expandsubinclude(kindpats, root):

62

'''Returns the list of subinclude matcher args and the kindpats without the

63

'''Returns the list of subinclude matcher args and the kindpats without the

63

subincludes in it.'''

64

subincludes in it.'''

64

relmatchers = []

65

relmatchers = []

65

other = []

66

other = []

66

67

for kind, pat, source in kindpats:

68

for kind, pat, source in kindpats:

68

if kind == 'subinclude':

69

if kind == 'subinclude':

69

sourceroot = pathutil.dirname(util.normpath(source))

70

sourceroot = pathutil.dirname(util.normpath(source))

70

pat = util.pconvert(pat)

71

pat = util.pconvert(pat)

71

path = pathutil.join(sourceroot, pat)

72

path = pathutil.join(sourceroot, pat)

72

73

newroot = pathutil.dirname(path)

74

newroot = pathutil.dirname(path)

74

matcherargs = (newroot, '', [], ['include:%s' % path])

75

matcherargs = (newroot, '', [], ['include:%s' % path])

75

76

prefix = pathutil.canonpath(root, root, newroot)

77

prefix = pathutil.canonpath(root, root, newroot)

77

if prefix:

78

if prefix:

78

prefix += '/'

79

prefix += '/'

79

relmatchers.append((prefix, matcherargs))

80

relmatchers.append((prefix, matcherargs))

80

else:

81

else:

81

other.append((kind, pat, source))

82

other.append((kind, pat, source))

82

83

return relmatchers, other

84

return relmatchers, other

84

85

def _kindpatsalwaysmatch(kindpats):

86

def _kindpatsalwaysmatch(kindpats):

86

""""Checks whether the kindspats match everything, as e.g.

87

""""Checks whether the kindspats match everything, as e.g.

87

'relpath:.' does.

88

'relpath:.' does.

88

"""

89

"""

89

for kind, pat, source in kindpats:

90

for kind, pat, source in kindpats:

90

if pat != '' or kind not in ['relpath', 'glob']:

91

if pat != '' or kind not in ['relpath', 'glob']:

91

return False

92

return False

92

return True

93

return True

93

94

def match(root, cwd, patterns=None, include=None, exclude=None, default='glob',
          exact=False, auditor=None, ctx=None, listsubrepos=False, warn=None,
          badfn=None, icasefs=False):
    """build an object to match a set of file patterns

    arguments:
    root - the canonical root of the tree you're matching against
    cwd - the current working directory, if relevant
    patterns - patterns to find
    include - patterns to include (unless they are excluded)
    exclude - patterns to exclude (even if they are included)
    default - if a pattern in patterns has no explicit type, assume this one
    exact - patterns are actually filenames (include/exclude still apply)
    warn - optional function used for printing warnings
    badfn - optional bad() callback for this matcher instead of the default
    icasefs - make a matcher for wdir on case insensitive filesystems, which
        normalizes the given patterns to the case in the filesystem

    a pattern is one of:
    'glob:<glob>' - a glob relative to cwd
    're:<regexp>' - a regular expression
    'path:<path>' - a path relative to repository root, which is matched
                    recursively
    'rootfilesin:<path>' - a path relative to repository root, which is
                    matched non-recursively (will not match subdirectories)
    'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
    'relpath:<path>' - a path relative to cwd
    'relre:<regexp>' - a regexp that needn't match the start of a name
    'set:<fileset>' - a fileset expression
    'include:<path>' - a file of patterns to read and include
    'subinclude:<path>' - a file of patterns to match against files under
                          the same directory
    '<something>' - a pattern of the specified default type

    Combining icasefs with exact raises error.ProgrammingError. With
    icasefs set, ctx must be provided because ctx.repo().dirstate is used
    to normalize the patterns.
    """
    normalize = _donormalize
    if icasefs:
        if exact:
            raise error.ProgrammingError("a case-insensitive exact matcher "
                                         "doesn't make sense")
        dirstate = ctx.repo().dirstate
        dsnormalize = dirstate.normalize

        # Wrap _donormalize so that every non-regex pattern is additionally
        # run through the dirstate's normalize().
        def normalize(patterns, default, root, cwd, auditor, warn):
            kp = _donormalize(patterns, default, root, cwd, auditor, warn)
            kindpats = []
            for kind, pats, source in kp:
                if kind not in ('re', 'relre'):  # regex can't be normalized
                    p = pats
                    pats = dsnormalize(pats)

                    # Preserve the original to handle a case only rename.
                    if p != pats and p in dirstate:
                        kindpats.append((kind, p, source))

                kindpats.append((kind, pats, source))
            return kindpats

    if exact:
        m = exactmatcher(root, cwd, patterns, badfn)
    elif patterns:
        kindpats = normalize(patterns, default, root, cwd, auditor, warn)
        if _kindpatsalwaysmatch(kindpats):
            m = alwaysmatcher(root, cwd, badfn, relativeuipath=True)
        else:
            m = patternmatcher(root, cwd, kindpats, ctx=ctx,
                               listsubrepos=listsubrepos, badfn=badfn)
    else:
        # It's a little strange that no patterns means to match everything.
        # Consider changing this to match nothing (probably using nevermatcher).
        m = alwaysmatcher(root, cwd, badfn)

    # include/exclude patterns always default to 'glob' and their matchers
    # are built without a bad() override.
    if include:
        kindpats = normalize(include, 'glob', root, cwd, auditor, warn)
        im = includematcher(root, cwd, kindpats, ctx=ctx,
                            listsubrepos=listsubrepos, badfn=None)
        m = intersectmatchers(m, im)
    if exclude:
        kindpats = normalize(exclude, 'glob', root, cwd, auditor, warn)
        em = includematcher(root, cwd, kindpats, ctx=ctx,
                            listsubrepos=listsubrepos, badfn=None)
        m = differencematcher(m, em)
    return m

176

177

def exact(root, cwd, files, badfn=None):
    '''Return an exactmatcher for the given files.'''
    return exactmatcher(root, cwd, files, badfn=badfn)

179

180

def always(root, cwd):
    '''Return an alwaysmatcher for the given root and cwd.'''
    return alwaysmatcher(root, cwd)

182

183

def never(root, cwd):
    '''Return a nevermatcher for the given root and cwd.'''
    return nevermatcher(root, cwd)

185

186

def badmatch(match, badfn):
    """Make a copy of the given matcher, replacing its bad method with the given
    one.

    The copy is shallow (copy.copy); the matcher passed in is not modified.
    """
    m = copy.copy(match)
    m.bad = badfn
    return m

193

194

def _donormalize(patterns, default, root, cwd, auditor, warn):

195

def _donormalize(patterns, default, root, cwd, auditor, warn):

195

'''Convert 'kind:pat' from the patterns list to tuples with kind and

196

'''Convert 'kind:pat' from the patterns list to tuples with kind and

196

normalized and rooted patterns and with listfiles expanded.'''

197

normalized and rooted patterns and with listfiles expanded.'''

197

kindpats = []

198

kindpats = []

198

for kind, pat in [_patsplit(p, default) for p in patterns]:

199

for kind, pat in [_patsplit(p, default) for p in patterns]:

199

if kind in cwdrelativepatternkinds:

200

if kind in cwdrelativepatternkinds:

200

pat = pathutil.canonpath(root, cwd, pat, auditor)

201

pat = pathutil.canonpath(root, cwd, pat, auditor)

201

elif kind in ('relglob', 'path', 'rootfilesin'):

202

elif kind in ('relglob', 'path', 'rootfilesin'):

202

pat = util.normpath(pat)

203

pat = util.normpath(pat)

203

elif kind in ('listfile', 'listfile0'):

204

elif kind in ('listfile', 'listfile0'):

204

try:

205

try:

205

files = util.readfile(pat)

206

files = util.readfile(pat)

206

if kind == 'listfile0':

207

if kind == 'listfile0':

207

files = files.split('\0')

208

files = files.split('\0')

208

else:

209

else:

209

files = files.splitlines()

210

files = files.splitlines()

210

files = [f for f in files if f]

211

files = [f for f in files if f]

211

except EnvironmentError:

212

except EnvironmentError:

212

raise error.Abort(_("unable to read file list (%s)") % pat)

213

raise error.Abort(_("unable to read file list (%s)") % pat)

213

for k, p, source in _donormalize(files, default, root, cwd,

214

for k, p, source in _donormalize(files, default, root, cwd,

214

auditor, warn):

215

auditor, warn):

215

kindpats.append((k, p, pat))

216

kindpats.append((k, p, pat))

216

continue

217

continue

217

elif kind == 'include':

218

elif kind == 'include':

218

try:

219

try:

219

fullpath = os.path.join(root, util.localpath(pat))

220

fullpath = os.path.join(root, util.localpath(pat))

220

includepats = readpatternfile(fullpath, warn)

221

includepats = readpatternfile(fullpath, warn)

221

for k, p, source in _donormalize(includepats, default,

222

for k, p, source in _donormalize(includepats, default,

222

root, cwd, auditor, warn):

223

root, cwd, auditor, warn):

223

kindpats.append((k, p, source or pat))

224

kindpats.append((k, p, source or pat))

224

except error.Abort as inst:

225

except error.Abort as inst:

225

raise error.Abort('%s: %s' % (pat, inst[0]))

226

raise error.Abort('%s: %s' % (pat, inst[0]))

226

except IOError as inst:

227

except IOError as inst:

227

if warn:

228

if warn:

228

warn(_("skipping unreadable pattern file '%s': %s\n") %

229

warn(_("skipping unreadable pattern file '%s': %s\n") %

229

(pat, inst.strerror))

230

(pat, util.forcebytestr(inst.strerror)))

230

continue

231

continue

231

# else: re or relre - which cannot be normalized

232

# else: re or relre - which cannot be normalized

232

kindpats.append((kind, pat, ''))

233

kindpats.append((kind, pat, ''))

233

return kindpats

234

return kindpats

234

235

class basematcher(object):
    '''Base class of the matchers in this module.

    By default it matches nothing (matchfn() returns False), lists no files
    and asks for every directory to be visited.'''

    def __init__(self, root, cwd, badfn=None, relativeuipath=True):
        self._root = root
        self._cwd = cwd
        # only shadow the class-level bad() when a callback was supplied
        if badfn is not None:
            self.bad = badfn
        self._relativeuipath = relativeuipath

    def __call__(self, fn):
        return self.matchfn(fn)
    def __iter__(self):
        for f in self._files:
            yield f
    # Callbacks related to how the matcher is used by dirstate.walk.
    # Subscribers to these events must monkeypatch the matcher object.
    def bad(self, f, msg):
        '''Callback from dirstate.walk for each explicit file that can't be
        found/accessed, with an error message.'''

    # If an explicitdir is set, it will be called when an explicitly listed
    # directory is visited.
    explicitdir = None

    # If a traversedir is set, it will be called when a directory discovered
    # by recursive traversal is visited.
    traversedir = None

    def abs(self, f):
        '''Convert a repo path back to path that is relative to the root of the
        matcher.'''
        return f

    def rel(self, f):
        '''Convert repo path back to path that is relative to cwd of matcher.'''
        return util.pathto(self._root, self._cwd, f)

    def uipath(self, f):
        '''Convert repo path to a display path.  If patterns or -I/-X were used
        to create this matcher, the display path will be relative to cwd.
        Otherwise it is relative to the root of the repo.'''
        # falls back to abs() as well when rel() yields a false value
        return (self._relativeuipath and self.rel(f)) or self.abs(f)

    @propertycache
    def _files(self):
        return []

    def files(self):
        '''Explicitly listed files or patterns or roots:
        if no patterns or .always(): empty list,
        if exact: list exact files,
        if not .anypats(): list all files and dirs,
        else: optimal roots'''
        return self._files

    @propertycache
    def _fileset(self):
        return set(self._files)

    def exact(self, f):
        '''Returns True if f is in .files().'''
        return f in self._fileset

    def matchfn(self, f):
        return False

    def visitdir(self, dir):
        '''Decides whether a directory should be visited based on whether it
        has potential matches in it or one of its subdirectories. This is
        based on the match's primary, included, and excluded patterns.

        Returns the string 'all' if the given directory and all subdirectories
        should be visited. Otherwise returns True or False indicating whether
        the given directory should be visited.
        '''
        return True

    def always(self):
        '''Matcher will match everything and .files() will be empty --
        optimization might be possible.'''
        return False

    def isexact(self):
        '''Matcher will match exactly the list of files in .files() --
        optimization might be possible.'''
        return False

    def prefix(self):
        '''Matcher will match the paths in .files() recursively --
        optimization might be possible.'''
        return False

    def anypats(self):
        '''None of .always(), .isexact(), and .prefix() is true --
        optimizations will be difficult.'''
        return not self.always() and not self.isexact() and not self.prefix()

331

332

class alwaysmatcher(basematcher):
    '''Matches everything.'''

    def __init__(self, root, cwd, badfn=None, relativeuipath=False):
        # unlike basematcher, relativeuipath defaults to False here
        super(alwaysmatcher, self).__init__(root, cwd, badfn,
                                            relativeuipath=relativeuipath)

    def always(self):
        return True

    def matchfn(self, f):
        return True

    def visitdir(self, dir):
        return 'all'

    def __repr__(self):
        return r'<alwaysmatcher>'

350

351

class nevermatcher(basematcher):
    '''Matches nothing.'''

    def __init__(self, root, cwd, badfn=None):
        super(nevermatcher, self).__init__(root, cwd, badfn)

    # It's a little weird to say that the nevermatcher is an exact matcher
    # or a prefix matcher, but it seems to make sense to let callers take
    # fast paths based on either. There will be no exact matches, nor any
    # prefixes (files() returns []), so fast paths iterating over them should
    # be efficient (and correct).
    def isexact(self):
        return True

    def prefix(self):
        return True

    def visitdir(self, dir):
        return False

    def __repr__(self):
        return r'<nevermatcher>'

373

374

class patternmatcher(basematcher):
    '''Matcher built from a list of (kind, pat, source) tuples; its match
    function comes from _buildmatch() with '$' as the glob suffix.'''

    def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                 badfn=None):
        super(patternmatcher, self).__init__(root, cwd, badfn)

        self._files = _explicitfiles(kindpats)
        self._prefix = _prefix(kindpats)
        self._pats, self.matchfn = _buildmatch(ctx, kindpats, '$', listsubrepos,
                                               root)

    @propertycache
    def _dirs(self):
        # util.dirs() of the explicit files, plus '.'
        return set(util.dirs(self._fileset)) | {'.'}

    def visitdir(self, dir):
        if self._prefix and dir in self._fileset:
            return 'all'
        return ('.' in self._fileset or
                dir in self._fileset or
                dir in self._dirs or
                any(parentdir in self._fileset
                    for parentdir in util.finddirs(dir)))

    def prefix(self):
        return self._prefix

    @encoding.strmethod
    def __repr__(self):
        return ('<patternmatcher patterns=%r>' % self._pats)

404

405

class includematcher(basematcher):
    '''Matcher used for include/exclude pattern lists; its match function
    comes from _buildmatch() with '(?:/|$)' as the glob suffix.'''

    def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                 badfn=None):
        super(includematcher, self).__init__(root, cwd, badfn)

        self._pats, self.matchfn = _buildmatch(ctx, kindpats, '(?:/|$)',
                                               listsubrepos, root)
        self._prefix = _prefix(kindpats)
        roots, dirs = _rootsanddirs(kindpats)
        # roots are directories which are recursively included.
        self._roots = set(roots)
        # dirs are directories which are non-recursively included.
        self._dirs = set(dirs)

    def visitdir(self, dir):
        if self._prefix and dir in self._roots:
            return 'all'
        return ('.' in self._roots or
                dir in self._roots or
                dir in self._dirs or
                any(parentdir in self._roots
                    for parentdir in util.finddirs(dir)))

    @encoding.strmethod
    def __repr__(self):
        return ('<includematcher includes=%r>' % pycompat.bytestr(self._pats))

432

433

class exactmatcher(basematcher):
    '''Matches the input files exactly. They are interpreted as paths, not
    patterns (so no kind-prefixes).
    '''

    def __init__(self, root, cwd, files, badfn=None):
        super(exactmatcher, self).__init__(root, cwd, badfn)

        # a list is stored as given; any other iterable is copied into a list
        if isinstance(files, list):
            self._files = files
        else:
            self._files = list(files)

    matchfn = basematcher.exact

    @propertycache
    def _dirs(self):
        # util.dirs() of the listed files, plus '.'
        return set(util.dirs(self._fileset)) | {'.'}

    def visitdir(self, dir):
        return dir in self._dirs

    def isexact(self):
        return True

    @encoding.strmethod
    def __repr__(self):
        return ('<exactmatcher files=%r>' % self._files)

461

462

class differencematcher(basematcher):
    '''Composes two matchers by matching if the first matches and the second
    does not.

    The second matcher's non-matching-attributes (root, cwd, bad, explicitdir,
    traversedir) are ignored.
    '''
    def __init__(self, m1, m2):
        super(differencematcher, self).__init__(m1._root, m1._cwd)
        self._m1 = m1
        self._m2 = m2
        self.bad = m1.bad
        self.explicitdir = m1.explicitdir
        self.traversedir = m1.traversedir

    def matchfn(self, f):
        return self._m1(f) and not self._m2(f)

    @propertycache
    def _files(self):
        if self.isexact():
            return [f for f in self._m1.files() if self(f)]
        # If m1 is not an exact matcher, we can't easily figure out the set of
        # files, because its files() are not always files. For example, if
        # m1 is "path:dir" and m2 is "rootfilesin:.", we don't
        # want to remove "dir" from the set even though it would match m2,
        # because the "dir" in m1 may not be a file.
        return self._m1.files()

    def visitdir(self, dir):
        # nothing is left to visit once m2 claims the whole subtree
        if self._m2.visitdir(dir) == 'all':
            return False
        return bool(self._m1.visitdir(dir))

    def isexact(self):
        return self._m1.isexact()

    @encoding.strmethod
    def __repr__(self):
        return ('<differencematcher m1=%r, m2=%r>' % (self._m1, self._m2))

502

503

def intersectmatchers(m1, m2):
    '''Composes two matchers by matching if both of them match.

    The second matcher's non-matching-attributes (root, cwd, bad, explicitdir,
    traversedir) are ignored.

    Shortcuts taken before building an intersectionmatcher:

    - if either argument is None, the result is ``m1 or m2`` (the other
      argument, assuming matcher objects are truthy);
    - if m1 always matches, a shallow copy of m2 is returned that carries
      m1's bad/explicitdir/traversedir/abs/rel;
    - if m2 always matches, a shallow copy of m1 is returned.

    In both copy cases the copy's _relativeuipath is OR-ed with the other
    matcher's value; the inputs themselves are not modified.
    '''
    if m1 is None or m2 is None:
        return m1 or m2
    if m1.always():
        m = copy.copy(m2)
        # TODO: Consider encapsulating these things in a class so there's only
        # one thing to copy from m1.
        m.bad = m1.bad
        m.explicitdir = m1.explicitdir
        m.traversedir = m1.traversedir
        m.abs = m1.abs
        m.rel = m1.rel
        m._relativeuipath |= m1._relativeuipath
        return m
    if m2.always():
        m = copy.copy(m1)
        m._relativeuipath |= m2._relativeuipath
        return m
    return intersectionmatcher(m1, m2)

527

528

class intersectionmatcher(basematcher):
    '''Matcher that matches only what both m1 and m2 match.

    root, cwd, bad, explicitdir and traversedir are taken from m1.
    '''
    def __init__(self, m1, m2):
        '''Wrap m1 and m2, copying the non-matching attributes from m1.'''
        super(intersectionmatcher, self).__init__(m1._root, m1._cwd)
        self._m1 = m1
        self._m2 = m2
        self.bad = m1.bad
        self.explicitdir = m1.explicitdir
        self.traversedir = m1.traversedir

    @propertycache
    def _files(self):
        '''Explicit files of the intersection.

        When at least one side is exact, its files() are filtered through
        the other side; otherwise both lists are concatenated.
        '''
        if self.isexact():
            m1, m2 = self._m1, self._m2
            # Make sure m1 names the exact matcher of the pair.
            if not m1.isexact():
                m1, m2 = m2, m1
            return [f for f in m1.files() if m2(f)]
        # If neither m1 nor m2 is an exact matcher, we can't easily intersect
        # the set of files, because their files() are not always files. For
        # example, if intersecting a matcher "-I glob:foo.txt" with matcher of
        # "path:dir2", we don't want to remove "dir2" from the set.
        return self._m1.files() + self._m2.files()

    def matchfn(self, f):
        '''Match f when both m1 and m2 match it.'''
        return self._m1(f) and self._m2(f)

    def visitdir(self, dir):
        '''Combine both visitdir() answers for dir.

        If m1 answers 'all', m2's answer is returned unchanged.  Otherwise
        the result is a plain bool.
        '''
        visit1 = self._m1.visitdir(dir)
        if visit1 == 'all':
            return self._m2.visitdir(dir)
        # bool() because visit1=True + visit2='all' should not be 'all'
        return bool(visit1 and self._m2.visitdir(dir))

    def always(self):
        '''True only if both wrapped matchers always match.'''
        return self._m1.always() and self._m2.always()

    def isexact(self):
        '''True if at least one wrapped matcher is exact.'''
        return self._m1.isexact() or self._m2.isexact()

    @encoding.strmethod
    def __repr__(self):
        '''Debug representation showing both wrapped matchers.'''
        return ('<intersectionmatcher m1=%r, m2=%r>' % (self._m1, self._m2))

569

570

class subdirmatcher(basematcher):
    """Adapt a matcher to work on a subdirectory only.

    The paths are remapped to remove/insert the path as needed:

    >>> from . import pycompat
    >>> m1 = match(b'root', b'', [b'a.txt', b'sub/b.txt'])
    >>> m2 = subdirmatcher(b'sub', m1)
    >>> bool(m2(b'a.txt'))
    False
    >>> bool(m2(b'b.txt'))
    True
    >>> bool(m2.matchfn(b'a.txt'))
    False
    >>> bool(m2.matchfn(b'b.txt'))
    True
    >>> m2.files()
    ['b.txt']
    >>> m2.exact(b'b.txt')
    True
    >>> util.pconvert(m2.rel(b'b.txt'))
    'sub/b.txt'
    >>> def bad(f, msg):
    ...     print(pycompat.sysstr(b"%s: %s" % (f, msg)))
    >>> m1.bad = bad
    >>> m2.bad(b'x.txt', b'No such file')
    sub/x.txt: No such file
    >>> m2.abs(b'c.txt')
    'sub/c.txt'
    """

    def __init__(self, path, matcher):
        '''Wrap matcher so that it is addressed relative to path.'''
        super(subdirmatcher, self).__init__(matcher._root, matcher._cwd)
        self._path = path
        self._matcher = matcher
        self._always = matcher.always()

        # Keep only the parent's files below path, with "path/" stripped.
        self._files = [f[len(path) + 1:] for f in matcher._files
                       if f.startswith(path + "/")]

        # If the parent repo had a path to this subrepo and the matcher is
        # a prefix matcher, this submatcher always matches.
        if matcher.prefix():
            self._always = any(f == path for f in matcher._files)

    def bad(self, f, msg):
        '''Forward to the wrapped matcher's bad() with path prepended.'''
        self._matcher.bad(self._path + "/" + f, msg)

    def abs(self, f):
        '''Forward to the wrapped matcher's abs() with path prepended.'''
        return self._matcher.abs(self._path + "/" + f)

    def rel(self, f):
        '''Forward to the wrapped matcher's rel() with path prepended.'''
        return self._matcher.rel(self._path + "/" + f)

    def uipath(self, f):
        '''Forward to the wrapped matcher's uipath() with path prepended.'''
        return self._matcher.uipath(self._path + "/" + f)

    def matchfn(self, f):
        '''Match f by asking the wrapped matcher about "path/f".'''
        # Some information is lost in the superclass's constructor, so we
        # can not accurately create the matching function for the subdirectory
        # from the inputs. Instead, we override matchfn() and visitdir() to
        # call the original matcher with the subdirectory path prepended.
        return self._matcher.matchfn(self._path + "/" + f)

    def visitdir(self, dir):
        '''Ask the wrapped matcher about dir, remapped below path.

        '.' maps to path itself; anything else maps to "path/dir".
        '''
        if dir == '.':
            dir = self._path
        else:
            dir = self._path + "/" + dir
        return self._matcher.visitdir(dir)

    def always(self):
        '''Return the always-flag computed in __init__.'''
        return self._always

    def prefix(self):
        '''True if the wrapped matcher is a prefix matcher and this one
        does not always match.'''
        return self._matcher.prefix() and not self._always

    @encoding.strmethod
    def __repr__(self):
        '''Debug representation showing the path and the wrapped matcher.'''
        return ('<subdirmatcher path=%r, matcher=%r>' %
                (self._path, self._matcher))

651

652

class unionmatcher(basematcher):
    """A matcher that is the union of several matchers.

    The non-matching-attributes (root, cwd, bad, explicitdir, traversedir) are
    taken from the first matcher.
    """

    def __init__(self, matchers):
        '''Build the union of matchers; matchers[0] supplies root and cwd.

        matchers must be non-empty, since its first element is read
        unconditionally.
        '''
        m1 = matchers[0]
        super(unionmatcher, self).__init__(m1._root, m1._cwd)
        # NOTE(review): the class docstring lists bad among the attributes
        # taken from the first matcher, but only explicitdir and
        # traversedir are assigned here -- confirm this is intended.
        self.explicitdir = m1.explicitdir
        self.traversedir = m1.traversedir
        self._matchers = matchers

    def matchfn(self, f):
        '''Return True as soon as any of the matchers matches f.'''
        for match in self._matchers:
            if match(f):
                return True
        return False

    def visitdir(self, dir):
        '''Combine the visitdir() answers of all matchers for dir.

        'all' from any matcher is returned immediately; otherwise the
        individual answers are OR-ed together.
        '''
        r = False
        for m in self._matchers:
            v = m.visitdir(dir)
            if v == 'all':
                return v
            r |= v
        return r

    @encoding.strmethod
    def __repr__(self):
        '''Debug representation showing the wrapped matchers.'''
        return ('<unionmatcher matchers=%r>' % self._matchers)

684

685

def patkind(pattern, default=None):
    '''If pattern is 'kind:pat' with a known kind, return kind.

    Otherwise return default.  This is the first element of the pair
    produced by _patsplit().
    '''
    return _patsplit(pattern, default)[0]

688

689

def _patsplit(pattern, default):

690

def _patsplit(pattern, default):

690

"""Split a string into the optional pattern kind prefix and the actual

691

"""Split a string into the optional pattern kind prefix and the actual

691

pattern."""

692

pattern."""

692

if ':' in pattern:

693

if ':' in pattern:

693

kind, pat = pattern.split(':', 1)

694

kind, pat = pattern.split(':', 1)

694

if kind in allpatternkinds:

695

if kind in allpatternkinds:

695

return kind, pat

696

return kind, pat

696

return default, pattern

697

return default, pattern

697

698

def _globre(pat):
    r'''Convert an extended glob string to a regexp string.

    >>> from . import pycompat
    >>> def bprint(s):
    ...     print(pycompat.sysstr(s))
    >>> bprint(_globre(br'?'))
    .
    >>> bprint(_globre(br'*'))
    [^/]*
    >>> bprint(_globre(br'**'))
    .*
    >>> bprint(_globre(br'**/a'))
    (?:.*/)?a
    >>> bprint(_globre(br'a/**/b'))
    a\/(?:.*/)?b
    >>> bprint(_globre(br'[a*?!^][^b][!c]'))
    [a*?!^][\^b][^c]
    >>> bprint(_globre(br'{a,b}'))
    (?:a|b)
    >>> bprint(_globre(br'.\*\?'))
    \.\*\?
    '''
    i, n = 0, len(pat)
    res = ''
    # Number of '{' groups currently open.
    group = 0
    escape = util.re.escape
    def peek():
        # Next unread character, or a false value at the end of pat.
        return i < n and pat[i:i + 1]
    while i < n:
        # Slice rather than index, so c is a one-element string.
        c = pat[i:i + 1]
        i += 1
        if c not in '*?[{},\\':
            res += escape(c)
        elif c == '*':
            if peek() == '*':
                i += 1
                if peek() == '/':
                    # '**/' also matches the empty prefix.
                    i += 1
                    res += '(?:.*/)?'
                else:
                    res += '.*'
            else:
                # A single '*' does not cross a '/'.
                res += '[^/]*'
        elif c == '?':
            res += '.'
        elif c == '[':
            # Look for the closing ']'; a leading '!' or ']' is part of
            # the class body and is skipped first.
            j = i
            if j < n and pat[j:j + 1] in '!]':
                j += 1
            while j < n and pat[j:j + 1] != ']':
                j += 1
            if j >= n:
                # No closing bracket: treat '[' as a literal.
                res += '\\['
            else:
                stuff = pat[i:j].replace('\\','\\\\')
                i = j + 1
                if stuff[0:1] == '!':
                    # Glob negation '!' becomes regexp negation '^'.
                    stuff = '^' + stuff[1:]
                elif stuff[0:1] == '^':
                    # A leading '^' is literal in the glob, so escape it.
                    stuff = '\\' + stuff
                res = '%s[%s]' % (res, stuff)
        elif c == '{':
            group += 1
            res += '(?:'
        elif c == '}' and group:
            res += ')'
            group -= 1
        elif c == ',' and group:
            res += '|'
        elif c == '\\':
            # A backslash escapes the next character; a trailing backslash
            # is emitted as a literal backslash.
            p = peek()
            if p:
                i += 1
                res += escape(p)
            else:
                res += escape(c)
        else:
            # '}' or ',' outside of any group: literal.
            res += escape(c)
    return res

778

779

def _regex(kind, pat, globsuffix):

780

def _regex(kind, pat, globsuffix):

780

'''Convert a (normalized) pattern of any kind into a regular expression.

781

'''Convert a (normalized) pattern of any kind into a regular expression.

781

globsuffix is appended to the regexp of globs.'''

782

globsuffix is appended to the regexp of globs.'''

782

if not pat:

783

if not pat:

783

return ''

784

return ''

784

if kind == 're':

785

if kind == 're':

785

return pat

786

return pat

786

if kind in ('path', 'relpath'):

787

if kind in ('path', 'relpath'):

787

if pat == '.':

788

if pat == '.':

788

return ''

789

return ''

789

return util.re.escape(pat) + '(?:/|$)'

790

return util.re.escape(pat) + '(?:/|$)'

790

if kind == 'rootfilesin':

791

if kind == 'rootfilesin':

791

if pat == '.':

792

if pat == '.':

792

escaped = ''

793

escaped = ''

793

else:

794

else:

794

# Pattern is a directory name.

795

# Pattern is a directory name.

795

escaped = util.re.escape(pat) + '/'

796

escaped = util.re.escape(pat) + '/'

796

# Anything after the pattern must be a non-directory.

797

# Anything after the pattern must be a non-directory.

797

return escaped + '[^/]+$'

798

return escaped + '[^/]+$'

798

if kind == 'relglob':

799

if kind == 'relglob':

799

return '(?:|.*/)' + _globre(pat) + globsuffix

800

return '(?:|.*/)' + _globre(pat) + globsuffix

800

if kind == 'relre':

801

if kind == 'relre':

801

if pat.startswith('^'):

802

if pat.startswith('^'):

802

return pat

803

return pat

803

return '.*' + pat

804

return '.*' + pat

804

return _globre(pat) + globsuffix

805

return _globre(pat) + globsuffix

805

806

def _buildmatch(ctx, kindpats, globsuffix, listsubrepos, root):
    '''Return regexp string and a matcher function for kindpats.
    globsuffix is appended to the regexp of globs.

    Up to three match functions are collected: one for subincludes, one
    for expanded file sets and one regexp matcher for the remaining
    patterns.  A single function is returned as-is; otherwise the result
    matches when any collected function matches.'''
    matchfuncs = []

    subincludes, kindpats = _expandsubinclude(kindpats, root)
    if subincludes:
        # Matchers for subincludes are built on first use, keyed by prefix.
        submatchers = {}
        def matchsubinclude(f):
            for prefix, matcherargs in subincludes:
                if f.startswith(prefix):
                    mf = submatchers.get(prefix)
                    if mf is None:
                        mf = match(*matcherargs)
                        submatchers[prefix] = mf

                    # The sub-matcher sees f with the prefix stripped.
                    if mf(f[len(prefix):]):
                        return True
            return False
        matchfuncs.append(matchsubinclude)

    fset, kindpats = _expandsets(kindpats, ctx, listsubrepos)
    if fset:
        matchfuncs.append(fset.__contains__)

    regex = ''
    if kindpats:
        regex, mf = _buildregexmatch(kindpats, globsuffix)
        matchfuncs.append(mf)

    if len(matchfuncs) == 1:
        return regex, matchfuncs[0]
    else:
        return regex, lambda f: any(mf(f) for mf in matchfuncs)

840

841

def _buildregexmatch(kindpats, globsuffix):
    """Build a match function from a list of kinds and kindpats,
    return regexp string and a matcher function.

    The patterns are joined into one alternation.  If that regexp is
    longer than 20000 characters, or compiling it raises OverflowError,
    the pattern list is split in two and each half is built recursively.
    If compilation raises re.error, each pattern is compiled on its own
    so the offending one can be named in the error.Abort that is raised."""
    try:
        regex = '(?:%s)' % '|'.join([_regex(k, p, globsuffix)
                                     for (k, p, s) in kindpats])
        if len(regex) > 20000:
            raise OverflowError
        return regex, _rematcher(regex)
    except OverflowError:
        # We're using a Python with a tiny regex engine and we
        # made it explode, so we'll divide the pattern list in two
        # until it works
        count = len(kindpats)
        if count < 2:
            # A single pattern can't be split further; re-raise.
            raise
        # Only the match functions of the halves are needed; the full
        # regexp string is still returned alongside them.
        a = _buildregexmatch(kindpats[:count // 2], globsuffix)[1]
        b = _buildregexmatch(kindpats[count // 2:], globsuffix)[1]
        return regex, lambda s: a(s) or b(s)
    except re.error:
        for k, p, s in kindpats:
            try:
                _rematcher('(?:%s)' % _regex(k, p, globsuffix))
            except re.error:
                if s:
                    raise error.Abort(_("%s: invalid pattern (%s): %s") %
                                     (s, k, p))
                else:
                    raise error.Abort(_("invalid pattern (%s): %s") % (k, p))
        # Every pattern compiled on its own, yet the combination failed.
        raise error.Abort(_("invalid pattern"))

871

872

def _patternrootsanddirs(kindpats):

873

def _patternrootsanddirs(kindpats):

873

'''Returns roots and directories corresponding to each pattern.

874

'''Returns roots and directories corresponding to each pattern.

874

875

This calculates the roots and directories exactly matching the patterns and

876

This calculates the roots and directories exactly matching the patterns and

876

returns a tuple of (roots, dirs) for each. It does not return other

877

returns a tuple of (roots, dirs) for each. It does not return other

877

directories which may also need to be considered, like the parent

878

directories which may also need to be considered, like the parent

878

directories.

879

directories.

879

'''

880

'''

880

r = []

881

r = []

881

d = []

882

d = []

882

for kind, pat, source in kindpats:

883

for kind, pat, source in kindpats:

883

if kind == 'glob': # find the non-glob prefix

884

if kind == 'glob': # find the non-glob prefix

884

root = []

885

root = []

885

for p in pat.split('/'):

886

for p in pat.split('/'):

886

if '[' in p or '{' in p or '*' in p or '?' in p:

887

if '[' in p or '{' in p or '*' in p or '?' in p:

887

break

888

break

888

root.append(p)

889

root.append(p)

889

r.append('/'.join(root) or '.')

890

r.append('/'.join(root) or '.')

890

elif kind in ('relpath', 'path'):

891

elif kind in ('relpath', 'path'):

891

r.append(pat or '.')

892

r.append(pat or '.')

892

elif kind in ('rootfilesin',):

893

elif kind in ('rootfilesin',):

893

d.append(pat or '.')

894

d.append(pat or '.')

894

else: # relglob, re, relre

895

else: # relglob, re, relre

895

r.append('.')

896

r.append('.')

896

return r, d

897

return r, d

897

898

def _roots(kindpats):
    '''Returns root directories to match recursively from the given patterns.

    This is the roots half of _patternrootsanddirs(); the dirs half is
    discarded.
    '''
    roots, dirs = _patternrootsanddirs(kindpats)
    return roots

902

903

def _rootsanddirs(kindpats):
    '''Returns roots and exact directories from patterns.

    roots are directories to match recursively, whereas exact directories should
    be matched non-recursively. The returned (roots, dirs) tuple will also
    include directories that need to be implicitly considered as either, such as
    parent directories.

    >>> _rootsanddirs(
    ...     [(b'glob', b'g/h/*', b''), (b'glob', b'g/h', b''),
    ...      (b'glob', b'g*', b'')])
    (['g/h', 'g/h', '.'], ['g', '.'])
    >>> _rootsanddirs(
    ...     [(b'rootfilesin', b'g/h', b''), (b'rootfilesin', b'', b'')])
    ([], ['g/h', '.', 'g', '.'])
    >>> _rootsanddirs(
    ...     [(b'relpath', b'r', b''), (b'path', b'p/p', b''),
    ...      (b'path', b'', b'')])
    (['r', 'p/p', '.'], ['p', '.'])
    >>> _rootsanddirs(
    ...     [(b'relglob', b'rg*', b''), (b're', b're/', b''),
    ...      (b'relre', b'rr', b'')])
    (['.', '.', '.'], ['.'])
    '''
    r, d = _patternrootsanddirs(kindpats)

    # Append the parents as non-recursive/exact directories, since they must be
    # scanned to get to either the roots or the other exact directories.
    d.extend(util.dirs(d))
    d.extend(util.dirs(r))
    # util.dirs() does not include the root directory, so add it manually
    d.append('.')

    return r, d

937

938

def _explicitfiles(kindpats):
    '''Returns the potential explicit filenames from the patterns.

    >>> _explicitfiles([(b'path', b'foo/bar', b'')])
    ['foo/bar']
    >>> _explicitfiles([(b'rootfilesin', b'foo/bar', b'')])
    []
    '''
    # Keep only the pattern kinds where one can specify filenames (vs only
    # directory names).
    filable = [kp for kp in kindpats if kp[0] not in ('rootfilesin',)]
    return _roots(filable)

950

951

def _prefix(kindpats):

952

def _prefix(kindpats):

952

'''Whether all the patterns match a prefix (i.e. recursively)'''

953

'''Whether all the patterns match a prefix (i.e. recursively)'''

953

for kind, pat, source in kindpats:

954

for kind, pat, source in kindpats:

954

if kind not in ('path', 'relpath'):

955

if kind not in ('path', 'relpath'):

955

return False

956

return False

956

return True

957

return True

957

958

_commentre = None

959

_commentre = None

959

960

def readpatternfile(filepath, warn, sourceinfo=False):
    '''parse a pattern file, returning a list of
    patterns. These patterns should be given to compile()
    to be validated and converted into a match function.

    trailing white space is dropped.
    the escape character is backslash.
    comments start with #.
    empty lines are skipped.

    lines can be of the following formats:

    syntax: regexp # defaults following lines to non-rooted regexps
    syntax: glob   # defaults following lines to non-rooted globs
    re:pattern     # non-rooted regular expression
    glob:pattern   # non-rooted glob
    pattern        # pattern of the current default type

    if sourceinfo is set, returns a list of tuples:
    (pattern, lineno, originalline). This is useful to debug ignore patterns.

    warn, when not None/false, is called with a message for every
    'syntax:' line naming an unknown syntax; such lines are otherwise ignored.
    '''
    # the comment-stripping regexp is compiled once and cached at module level
    global _commentre

    syntaxes = {'re': 'relre:', 'regexp': 'relre:', 'glob': 'relglob:',
                'include': 'include', 'subinclude': 'subinclude'}
    syntax = 'relre:'
    patterns = []

    # 'with' guarantees the file is closed even if parsing raises
    with open(filepath, 'rb') as fp:
        for lineno, line in enumerate(util.iterfile(fp), start=1):
            if "#" in line:
                if not _commentre:
                    _commentre = util.re.compile(br'((?:^|[^\\])(?:\\\\)*)#.*')
                # remove comments prefixed by an even number of escapes
                m = _commentre.search(line)
                if m:
                    line = line[:m.end(1)]
                # fixup properly escaped comments that survived the above
                line = line.replace("\\#", "#")
            line = line.rstrip()
            if not line:
                continue

            if line.startswith('syntax:'):
                s = line[7:].strip()
                try:
                    syntax = syntaxes[s]
                except KeyError:
                    if warn:
                        warn(_("%s: ignoring invalid syntax '%s'\n") %
                             (filepath, s))
                continue

            # a per-line 'kind:' prefix overrides the current default syntax
            linesyntax = syntax
            for s, rels in syntaxes.iteritems():
                if line.startswith(rels):
                    linesyntax = rels
                    line = line[len(rels):]
                    break
                elif line.startswith(s+':'):
                    linesyntax = rels
                    line = line[len(s) + 1:]
                    break
            if sourceinfo:
                patterns.append((linesyntax + line, lineno, line))
            else:
                patterns.append(linesyntax + line)
    return patterns

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # match.py - filename matching
             #
             #  Copyright 2008, 2009 Matt Mackall <mpm@selenic.com> and others
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import, print_function
             import copy
             import os
             import re
             from .i18n import _
             from . import (
                 encoding,
                 error,
                 pathutil,
+                pycompat,
                 util,
             )
             # Pattern kind names, i.e. the part before ':' in a 'kind:pattern' string.
             allpatternkinds = ('re', 'glob', 'path', 'relglob', 'relpath', 'relre',
                                'listfile', 'listfile0', 'set', 'include', 'subinclude',
                                'rootfilesin')
             # Kinds whose pattern _donormalize() canonicalizes relative to cwd with
             # pathutil.canonpath().
             cwdrelativepatternkinds = ('relpath', 'glob')
             # Module-level alias so the classes below can write @propertycache.
             propertycache = util.propertycache
             def _rematcher(regex):
                 '''Compile ``regex`` with util.re and return a function that matches a
                 string against it.
                 The compiled object's ``test_match`` attribute is preferred when it
                 exists (facebook's re2 bindings provide it and it is slightly faster);
                 otherwise the regular ``match`` method is returned.'''
                 compiled = util.re.compile(regex)
                 try:
                     matcher = compiled.test_match
                 except AttributeError:
                     matcher = compiled.match
                 return matcher
             def _expandsets(kindpats, ctx, listsubrepos):
                 '''Returns the kindpats list with the 'set' patterns expanded.'''
                 fset = set()
                 other = []
                 for kind, pat, source in kindpats:
                     if kind == 'set':
                         if not ctx:
                             raise error.ProgrammingError("fileset expression with no "
                                                          "context")
                         s = ctx.getfileset(pat)
                         fset.update(s)
                         if listsubrepos:
                             for subpath in ctx.substate:
                                 s = ctx.sub(subpath).getfileset(pat)
                                 fset.update(subpath + '/' + f for f in s)
                         continue
                     other.append((kind, pat, source))
                 return fset, other
             def _expandsubinclude(kindpats, root):
                 '''Returns the list of subinclude matcher args and the kindpats without the
                 subincludes in it.'''
                 relmatchers = []
                 other = []
                 for kind, pat, source in kindpats:
                     if kind == 'subinclude':
                         sourceroot = pathutil.dirname(util.normpath(source))
                         pat = util.pconvert(pat)
                         path = pathutil.join(sourceroot, pat)
                         newroot = pathutil.dirname(path)
                         matcherargs = (newroot, '', [], ['include:%s' % path])
                         prefix = pathutil.canonpath(root, root, newroot)
                         if prefix:
                             prefix += '/'
                         relmatchers.append((prefix, matcherargs))
                     else:
                         other.append((kind, pat, source))
                 return relmatchers, other
             def _kindpatsalwaysmatch(kindpats):
                 """"Checks whether the kindspats match everything, as e.g.
                 'relpath:.' does.
                 """
                 for kind, pat, source in kindpats:
                     if pat != '' or kind not in ['relpath', 'glob']:
                         return False
                 return True
             def match(root, cwd, patterns=None, include=None, exclude=None, default='glob',
                       exact=False, auditor=None, ctx=None, listsubrepos=False, warn=None,
                       badfn=None, icasefs=False):
                 """build an object to match a set of file patterns
                 arguments:
                 root - the canonical root of the tree you're matching against
                 cwd - the current working directory, if relevant
                 patterns - patterns to find
                 include - patterns to include (unless they are excluded)
                 exclude - patterns to exclude (even if they are included)
                 default - if a pattern in patterns has no explicit type, assume this one
                 exact - patterns are actually filenames (include/exclude still apply)
                 auditor - handed to the pattern normalizer together with root and cwd
                 ctx - context passed to the pattern/include matchers; it also supplies
                     the dirstate (ctx.repo().dirstate) when icasefs is set
                 listsubrepos - passed through to the pattern/include matchers
                 warn - optional function used for printing warnings
                 badfn - optional bad() callback for this matcher instead of the default
                 icasefs - make a matcher for wdir on case insensitive filesystems, which
                     normalizes the given patterns to the case in the filesystem
                 a pattern is one of:
                 'glob:<glob>' - a glob relative to cwd
                 're:<regexp>' - a regular expression
                 'path:<path>' - a path relative to repository root, which is matched
                                 recursively
                 'rootfilesin:<path>' - a path relative to repository root, which is
                                 matched non-recursively (will not match subdirectories)
                 'relglob:<glob>' - an unrooted glob (*.c matches C files in all dirs)
                 'relpath:<path>' - a path relative to cwd
                 'relre:<regexp>' - a regexp that needn't match the start of a name
                 'set:<fileset>' - a fileset expression
                 'include:<path>' - a file of patterns to read and include
                 'subinclude:<path>' - a file of patterns to match against files under
                                       the same directory
                 '<something>' - a pattern of the specified default type
                 raises error.ProgrammingError when both icasefs and exact are set
                 """
                 # default normalizer; replaced by a case-folding wrapper when icasefs
                 normalize = _donormalize
                 if icasefs:
                     if exact:
                         raise error.ProgrammingError("a case-insensitive exact matcher "
                                                      "doesn't make sense")
                     # this branch dereferences ctx, so a ctx must be supplied here
                     dirstate = ctx.repo().dirstate
                     dsnormalize = dirstate.normalize
                     def normalize(patterns, default, root, cwd, auditor, warn):
                         kp = _donormalize(patterns, default, root, cwd, auditor, warn)
                         kindpats = []
                         for kind, pats, source in kp:
                             if kind not in ('re', 'relre'):  # regex can't be normalized
                                 p = pats
                                 pats = dsnormalize(pats)
                                 # Preserve the original to handle a case only rename.
                                 if p != pats and p in dirstate:
                                     kindpats.append((kind, p, source))
                             kindpats.append((kind, pats, source))
                         return kindpats
                 # build the primary matcher; it is the only one that receives badfn
                 if exact:
                     m = exactmatcher(root, cwd, patterns, badfn)
                 elif patterns:
                     kindpats = normalize(patterns, default, root, cwd, auditor, warn)
                     if _kindpatsalwaysmatch(kindpats):
                         m = alwaysmatcher(root, cwd, badfn, relativeuipath=True)
                     else:
                         m = patternmatcher(root, cwd, kindpats, ctx=ctx,
                                            listsubrepos=listsubrepos, badfn=badfn)
                 else:
                     # It's a little strange that no patterns means to match everything.
                     # Consider changing this to match nothing (probably using nevermatcher).
                     m = alwaysmatcher(root, cwd, badfn)
                 # include patterns narrow the primary matcher (intersection)
                 if include:
                     kindpats = normalize(include, 'glob', root, cwd, auditor, warn)
                     im = includematcher(root, cwd, kindpats, ctx=ctx,
                                         listsubrepos=listsubrepos, badfn=None)
                     m = intersectmatchers(m, im)
                 # exclude patterns are subtracted last, so they win over includes
                 if exclude:
                     kindpats = normalize(exclude, 'glob', root, cwd, auditor, warn)
                     em = includematcher(root, cwd, kindpats, ctx=ctx,
                                         listsubrepos=listsubrepos, badfn=None)
                     m = differencematcher(m, em)
                 return m
             def exact(root, cwd, files, badfn=None):
                 '''Return an exactmatcher built from root, cwd, files and badfn.'''
                 return exactmatcher(root, cwd, files, badfn=badfn)
             def always(root, cwd):
                 '''Return an alwaysmatcher for root and cwd.'''
                 return alwaysmatcher(root, cwd)
             def never(root, cwd):
                 '''Return a nevermatcher for root and cwd.'''
                 return nevermatcher(root, cwd)
             def badmatch(match, badfn):
                 """Return a shallow copy of ``match`` whose ``bad`` callback is ``badfn``.
                 The matcher passed in is left untouched.
                 """
                 clone = copy.copy(match)
                 clone.bad = badfn
                 return clone
             def _donormalize(patterns, default, root, cwd, auditor, warn):
                 '''Convert 'kind:pat' from the patterns list to tuples with kind and
                 normalized and rooted patterns and with listfiles expanded.
                 Returns a list of (kind, pat, source) tuples. ``source`` is '' for a
                 pattern given directly and names the listfile or include file for a
                 pattern read from one.
                 Raises error.Abort when a listfile cannot be read or when processing
                 an include file aborts. An include file that raises IOError is
                 reported through ``warn`` (if given) and skipped.'''
                 kindpats = []
                 for kind, pat in [_patsplit(p, default) for p in patterns]:
                     if kind in cwdrelativepatternkinds:
                         pat = pathutil.canonpath(root, cwd, pat, auditor)
                     elif kind in ('relglob', 'path', 'rootfilesin'):
                         pat = util.normpath(pat)
                     elif kind in ('listfile', 'listfile0'):
                         try:
                             files = util.readfile(pat)
                             # listfile0 entries are NUL-separated, listfile entries
                             # are one per line
                             if kind == 'listfile0':
                                 files = files.split('\0')
                             else:
                                 files = files.splitlines()
                             files = [f for f in files if f]
                         except EnvironmentError:
                             raise error.Abort(_("unable to read file list (%s)") % pat)
                         # every pattern from the list records the list file as source
                         for k, p, source in _donormalize(files, default, root, cwd,
                                                          auditor, warn):
                             kindpats.append((k, p, pat))
                         continue
                     elif kind == 'include':
                         try:
                             fullpath = os.path.join(root, util.localpath(pat))
                             includepats = readpatternfile(fullpath, warn)
                             # keep the innermost source when includes are nested
                             for k, p, source in _donormalize(includepats, default,
                                                              root, cwd, auditor, warn):
                                 kindpats.append((k, p, source or pat))
                         except error.Abort as inst:
                             # args[0] is the message; exceptions are not subscriptable
                             # on every Python version
                             raise error.Abort('%s: %s' % (pat, inst.args[0]))
                         except IOError as inst:
                             if warn:
                                 warn(_("skipping unreadable pattern file '%s': %s\n") %
                                      (pat, util.forcebytestr(inst.strerror)))
                         continue
                     # else: re or relre - which cannot be normalized
                     kindpats.append((kind, pat, ''))
                 return kindpats
             class basematcher(object):
                 '''Base class of the matchers in this module.
                 It stores root, cwd and the relative-uipath flag and supplies defaults
                 that match nothing: an empty files() list, a matchfn() returning False
                 and always()/isexact()/prefix() all returning False.
                 '''
                 def __init__(self, root, cwd, badfn=None, relativeuipath=True):
                     self._root = root
                     self._cwd = cwd
                     # an explicit badfn shadows the class-level bad() on this instance
                     if badfn is not None:
                         self.bad = badfn
                     self._relativeuipath = relativeuipath
                 def __call__(self, fn):
                     '''Calling the matcher is the same as calling matchfn(fn).'''
                     return self.matchfn(fn)
                 def __iter__(self):
                     '''Iterate over the entries of self._files.'''
                     for f in self._files:
                         yield f
                 # Callbacks related to how the matcher is used by dirstate.walk.
                 # Subscribers to these events must monkeypatch the matcher object.
                 def bad(self, f, msg):
                     '''Callback from dirstate.walk for each explicit file that can't be
                     found/accessed, with an error message.'''
                 # If an explicitdir is set, it will be called when an explicitly listed
                 # directory is visited.
                 explicitdir = None
                 # If a traversedir is set, it will be called when a directory discovered
                 # by recursive traversal is visited.
                 traversedir = None
                 def abs(self, f):
                     '''Convert a repo path back to path that is relative to the root of the
                     matcher.'''
                     return f
                 def rel(self, f):
                     '''Convert repo path back to path that is relative to cwd of matcher.'''
                     return util.pathto(self._root, self._cwd, f)
                 def uipath(self, f):
                     '''Convert repo path to a display path.  If patterns or -I/-X were used
                     to create this matcher, the display path will be relative to cwd.
                     Otherwise it is relative to the root of the repo.'''
                     # and/or idiom: abs(f) is also used when rel(f) is falsy
                     return (self._relativeuipath and self.rel(f)) or self.abs(f)
                 @propertycache
                 def _files(self):
                     # default: no explicit files; subclasses assign or override this
                     return []
                 def files(self):
                     '''Explicitly listed files or patterns or roots:
                     if no patterns or .always(): empty list,
                     if exact: list exact files,
                     if not .anypats(): list all files and dirs,
                     else: optimal roots'''
                     return self._files
                 @propertycache
                 def _fileset(self):
                     # set view of _files, used for membership tests
                     return set(self._files)
                 def exact(self, f):
                     '''Returns True if f is in .files().'''
                     return f in self._fileset
                 def matchfn(self, f):
                     '''Default match function: matches nothing.'''
                     return False
                 def visitdir(self, dir):
                     '''Decides whether a directory should be visited based on whether it
                     has potential matches in it or one of its subdirectories. This is
                     based on the match's primary, included, and excluded patterns.
                     Returns the string 'all' if the given directory and all subdirectories
                     should be visited. Otherwise returns True or False indicating whether
                     the given directory should be visited.
                     '''
                     return True
                 def always(self):
                     '''Matcher will match everything and .files() will be empty --
                     optimization might be possible.'''
                     return False
                 def isexact(self):
                     '''Matcher will match exactly the list of files in .files() --
                     optimization might be possible.'''
                     return False
                 def prefix(self):
                     '''Matcher will match the paths in .files() recursively --
                     optimization might be possible.'''
                     return False
                 def anypats(self):
                     '''None of .always(), .isexact(), and .prefix() is true --
                     optimizations will be difficult.'''
                     return not self.always() and not self.isexact() and not self.prefix()
             class alwaysmatcher(basematcher):
                 '''Matches everything.'''
                 # relativeuipath defaults to False here, whereas basematcher defaults
                 # it to True
                 def __init__(self, root, cwd, badfn=None, relativeuipath=False):
                     super(alwaysmatcher, self).__init__(root, cwd, badfn,
                                                         relativeuipath=relativeuipath)
                 def always(self):
                     return True
                 def matchfn(self, f):
                     return True
                 def visitdir(self, dir):
                     # every directory and all of its subdirectories are visited
                     return 'all'
                 def __repr__(self):
                     return r'<alwaysmatcher>'
             class nevermatcher(basematcher):
                 '''Matches nothing.'''
                 # matchfn() is inherited from basematcher and returns False
                 def __init__(self, root, cwd, badfn=None):
                     super(nevermatcher, self).__init__(root, cwd, badfn)
                 # It's a little weird to say that the nevermatcher is an exact matcher
                 # or a prefix matcher, but it seems to make sense to let callers take
                 # fast paths based on either. There will be no exact matches, nor any
                 # prefixes (files() returns []), so fast paths iterating over them should
                 # be efficient (and correct).
                 def isexact(self):
                     return True
                 def prefix(self):
                     return True
                 def visitdir(self, dir):
                     # no directory needs to be visited
                     return False
                 def __repr__(self):
                     return r'<nevermatcher>'
             class patternmatcher(basematcher):
                 '''Matcher built from a list of (kind, pat, source) patterns.
                 files() holds the result of _explicitfiles(kindpats), prefix() reports
                 _prefix(kindpats), and the match function comes from _buildmatch().
                 '''
                 def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                              badfn=None):
                     super(patternmatcher, self).__init__(root, cwd, badfn)
                     self._files = _explicitfiles(kindpats)
                     self._prefix = _prefix(kindpats)
                     pats, matchfn = _buildmatch(ctx, kindpats, '$', listsubrepos, root)
                     self._pats = pats
                     self.matchfn = matchfn
                 @propertycache
                 def _dirs(self):
                     # parent directories of the explicit files, plus the root '.'
                     parents = set(util.dirs(self._fileset))
                     parents.add('.')
                     return parents
                 def visitdir(self, dir):
                     '''Return 'all' for a listed directory of a prefix matcher,
                     otherwise True/False depending on whether dir may hold matches.'''
                     explicit = self._fileset
                     if self._prefix and dir in explicit:
                         return 'all'
                     if '.' in explicit or dir in explicit or dir in self._dirs:
                         return True
                     # dir lies below one of the explicitly listed paths
                     return any(parent in explicit
                                for parent in util.finddirs(dir))
                 def prefix(self):
                     return self._prefix
                 @encoding.strmethod
                 def __repr__(self):
                     return ('<patternmatcher patterns=%r>' % self._pats)
             class includematcher(basematcher):
                 '''Matcher built from include/exclude style (kind, pat, source)
                 patterns; match() uses it for its ``include`` and ``exclude`` arguments.
                 visitdir() is answered from the roots and dirs returned by
                 _rootsanddirs(kindpats).
                 '''
                 def __init__(self, root, cwd, kindpats, ctx=None, listsubrepos=False,
                              badfn=None):
                     super(includematcher, self).__init__(root, cwd, badfn)
                     self._pats, self.matchfn = _buildmatch(ctx, kindpats, '(?:/|$)',
                                                            listsubrepos, root)
                     self._prefix = _prefix(kindpats)
                     roots, dirs = _rootsanddirs(kindpats)
                     # roots are directories which are recursively included.
                     self._roots = set(roots)
                     # dirs are directories which are non-recursively included.
                     self._dirs = set(dirs)
                 def visitdir(self, dir):
                     '''Return 'all' for a root of a prefix matcher, otherwise
                     True/False depending on whether dir may hold matches.'''
                     if self._prefix and dir in self._roots:
                         return 'all'
                     return ('.' in self._roots or
                             dir in self._roots or
                             dir in self._dirs or
                             any(parentdir in self._roots
                                 for parentdir in util.finddirs(dir)))
                 @encoding.strmethod
                 def __repr__(self):
                     return ('<includematcher includes=%r>'
                             % pycompat.bytestr(self._pats))
             class exactmatcher(basematcher):
                 '''Matcher for an explicit list of files. The entries are taken as
                 plain paths, never as patterns (so no kind-prefixes).
                 '''
                 def __init__(self, root, cwd, files, badfn=None):
                     super(exactmatcher, self).__init__(root, cwd, badfn)
                     # a list argument is kept as-is; any other iterable is copied
                     self._files = files if isinstance(files, list) else list(files)
                 # a file matches exactly when it is one of the listed files
                 matchfn = basematcher.exact
                 @propertycache
                 def _dirs(self):
                     # parent directories of the listed files, plus the root '.'
                     parents = set(util.dirs(self._fileset))
                     parents.add('.')
                     return parents
                 def visitdir(self, dir):
                     return dir in self._dirs
                 def isexact(self):
                     return True
                 @encoding.strmethod
                 def __repr__(self):
                     return ('<exactmatcher files=%r>' % self._files)
             class differencematcher(basematcher):
                 '''Matcher for "m1 minus m2": a file matches when m1 matches it and m2
                 does not.
                 Root, cwd, bad, explicitdir and traversedir are all taken from m1; the
                 corresponding attributes of m2 are ignored.
                 '''
                 def __init__(self, m1, m2):
                     super(differencematcher, self).__init__(m1._root, m1._cwd)
                     self._m1 = m1
                     self._m2 = m2
                     self.bad = m1.bad
                     self.explicitdir = m1.explicitdir
                     self.traversedir = m1.traversedir
                 def matchfn(self, f):
                     included = self._m1(f)
                     if not included:
                         return included
                     return not self._m2(f)
                 @propertycache
                 def _files(self):
                     if not self.isexact():
                         # When m1 is not exact its files() need not be files at all.
                         # E.g. with m1 "path:dir" and m2 "rootfilesin:.", "dir" must
                         # stay in the list although m2 would match it, since "dir"
                         # may be a directory rather than a file.
                         return self._m1.files()
                     return [f for f in self._m1.files() if self(f)]
                 def visitdir(self, dir):
                     # a directory that m2 covers completely cannot contain matches
                     excluded = self._m2.visitdir(dir) == 'all'
                     return not excluded and bool(self._m1.visitdir(dir))
                 def isexact(self):
                     return self._m1.isexact()
                 @encoding.strmethod
                 def __repr__(self):
                     return ('<differencematcher m1=%r, m2=%r>' % (self._m1, self._m2))
             def intersectmatchers(m1, m2):
                 '''Return a matcher that matches what both m1 and m2 match.
                 If either argument is None the other one is returned. If one of them
                 is an always-matcher, a copy of the other is returned instead of a new
                 intersectionmatcher.
                 The second matcher's non-matching-attributes (root, cwd, bad, explicitdir,
                 traversedir) are ignored.
                 '''
                 if m1 is None or m2 is None:
                     return m1 or m2
                 if m1.always():
                     merged = copy.copy(m2)
                     # TODO: Consider encapsulating these things in a class so there's
                     # only one thing to copy from m1.
                     for name in ('bad', 'explicitdir', 'traversedir', 'abs', 'rel'):
                         setattr(merged, name, getattr(m1, name))
                     merged._relativeuipath |= m1._relativeuipath
                     return merged
                 if m2.always():
                     merged = copy.copy(m1)
                     merged._relativeuipath |= m2._relativeuipath
                     return merged
                 return intersectionmatcher(m1, m2)
             class intersectionmatcher(basematcher):
                 '''Matcher that matches a file only when both m1 and m2 match it.
                 Root, cwd, bad, explicitdir and traversedir are taken from m1.
                 '''
                 def __init__(self, m1, m2):
                     super(intersectionmatcher, self).__init__(m1._root, m1._cwd)
                     self._m1 = m1
                     self._m2 = m2
                     self.bad = m1.bad
                     self.explicitdir = m1.explicitdir
                     self.traversedir = m1.traversedir
                 @propertycache
                 def _files(self):
                     if not self.isexact():
                         # If neither m1 nor m2 is an exact matcher, the file lists
                         # cannot simply be intersected because files() entries are
                         # not always files. E.g. when intersecting "-I glob:foo.txt"
                         # with "path:dir2", "dir2" must not be dropped from the list.
                         return self._m1.files() + self._m2.files()
                     # filter the exact side's files through the other matcher
                     if self._m1.isexact():
                         exactside, otherside = self._m1, self._m2
                     else:
                         exactside, otherside = self._m2, self._m1
                     return [f for f in exactside.files() if otherside(f)]
                 def matchfn(self, f):
                     first = self._m1(f)
                     if not first:
                         return first
                     return self._m2(f)
                 def visitdir(self, dir):
                     first = self._m1.visitdir(dir)
                     if not first:
                         return False
                     second = self._m2.visitdir(dir)
                     if first == 'all':
                         return second
                     # first=True combined with second='all' must not yield 'all'
                     return bool(second)
                 def always(self):
                     return self._m1.always() and self._m2.always()
                 def isexact(self):
                     return self._m1.isexact() or self._m2.isexact()
                 @encoding.strmethod
                 def __repr__(self):
                     return ('<intersectionmatcher m1=%r, m2=%r>' % (self._m1, self._m2))
             class subdirmatcher(basematcher):
                 """Adapt a matcher to work on a subdirectory only.

                 Every path handed to the wrapped matcher is prefixed with
                 path + "/"; the file list keeps only the wrapped matcher's files
                 located below path, with that prefix removed:

                 >>> from . import pycompat
                 >>> m1 = match(b'root', b'', [b'a.txt', b'sub/b.txt'])
                 >>> m2 = subdirmatcher(b'sub', m1)
                 >>> bool(m2(b'a.txt'))
                 False
                 >>> bool(m2(b'b.txt'))
                 True
                 >>> bool(m2.matchfn(b'a.txt'))
                 False
                 >>> bool(m2.matchfn(b'b.txt'))
                 True
                 >>> m2.files()
                 ['b.txt']
                 >>> m2.exact(b'b.txt')
                 True
                 >>> util.pconvert(m2.rel(b'b.txt'))
                 'sub/b.txt'
                 >>> def bad(f, msg):
                 ...     print(pycompat.sysstr(b"%s: %s" % (f, msg)))
                 >>> m1.bad = bad
                 >>> m2.bad(b'x.txt', b'No such file')
                 sub/x.txt: No such file
                 >>> m2.abs(b'c.txt')
                 'sub/c.txt'
                 """

                 def __init__(self, path, matcher):
                     super(subdirmatcher, self).__init__(matcher._root, matcher._cwd)
                     self._path = path
                     self._matcher = matcher
                     self._always = matcher.always()
                     # Keep the files located below path, relative to path.
                     dirprefix = path + "/"
                     skip = len(dirprefix)
                     self._files = [name[skip:] for name in matcher._files
                                    if name.startswith(dirprefix)]
                     # For a prefix matcher, this submatcher matches everything
                     # exactly when the parent listed the subdirectory path itself.
                     if matcher.prefix():
                         self._always = path in matcher._files

                 def bad(self, f, msg):
                     parentpath = self._path + "/" + f
                     self._matcher.bad(parentpath, msg)

                 def abs(self, f):
                     parentpath = self._path + "/" + f
                     return self._matcher.abs(parentpath)

                 def rel(self, f):
                     parentpath = self._path + "/" + f
                     return self._matcher.rel(parentpath)

                 def uipath(self, f):
                     parentpath = self._path + "/" + f
                     return self._matcher.uipath(parentpath)

                 def matchfn(self, f):
                     # The superclass constructor drops some information, so the
                     # matching function for the subdirectory cannot be rebuilt
                     # from its inputs. matchfn() and visitdir() therefore delegate
                     # to the original matcher with the subdirectory path prepended.
                     parentpath = self._path + "/" + f
                     return self._matcher.matchfn(parentpath)

                 def visitdir(self, dir):
                     # '.' stands for the subdirectory itself.
                     parentdir = self._path if dir == '.' else self._path + "/" + dir
                     return self._matcher.visitdir(parentdir)

                 def always(self):
                     return self._always

                 def prefix(self):
                     inner = self._matcher.prefix()
                     if not inner:
                         return inner
                     return not self._always

                 @encoding.strmethod
                 def __repr__(self):
                     details = (self._path, self._matcher)
                     return '<subdirmatcher path=%r, matcher=%r>' % details
             class unionmatcher(basematcher):
                 """A matcher that is the union of several matchers.

                 The non-matching-attributes (root, cwd, bad, explicitdir, traversedir) are
                 taken from the first matcher.
                 """

                 def __init__(self, matchers):
                     first = matchers[0]
                     super(unionmatcher, self).__init__(first._root, first._cwd)
                     self.explicitdir = first.explicitdir
                     self.traversedir = first.traversedir
                     self._matchers = matchers

                 def matchfn(self, f):
                     # True as soon as one of the matchers accepts f.
                     return any(m(f) for m in self._matchers)

                 def visitdir(self, dir):
                     # 'all' from any matcher wins immediately; otherwise the
                     # individual answers are or-ed together.
                     combined = False
                     for m in self._matchers:
                         answer = m.visitdir(dir)
                         if answer == 'all':
                             return answer
                         combined |= answer
                     return combined

                 @encoding.strmethod
                 def __repr__(self):
                     return '<unionmatcher matchers=%r>' % self._matchers
             def patkind(pattern, default=None):
                 '''If pattern is 'kind:pat' with a known kind, return kind.

                 Otherwise return default.'''
                 kind, unused = _patsplit(pattern, default)
                 return kind
             def _patsplit(pattern, default):
                 """Split a string into the optional pattern kind prefix and the actual
                 pattern."""
                 if ':' in pattern:
                     kind, pat = pattern.split(':', 1)
                     if kind in allpatternkinds:
                         return kind, pat
                 return default, pattern
             def _globre(pat):
                 r'''Convert an extended glob string to a regexp string.

                 >>> from . import pycompat
                 >>> def bprint(s):
                 ...     print(pycompat.sysstr(s))
                 >>> bprint(_globre(br'?'))
                 .
                 >>> bprint(_globre(br'*'))
                 [^/]*
                 >>> bprint(_globre(br'**'))
                 .*
                 >>> bprint(_globre(br'**/a'))
                 (?:.*/)?a
                 >>> bprint(_globre(br'a/**/b'))
                 a\/(?:.*/)?b
                 >>> bprint(_globre(br'[a*?!^][^b][!c]'))
                 [a*?!^][\^b][^c]
                 >>> bprint(_globre(br'{a,b}'))
                 (?:a|b)
                 >>> bprint(_globre(br'.\*\?'))
                 \.\*\?
                 '''
                 escape = util.re.escape
                 pieces = []
                 depth = 0  # number of currently open '{' groups
                 pos, end = 0, len(pat)
                 while pos < end:
                     # one-element slices keep working when pat is a bytes object
                     ch = pat[pos:pos + 1]
                     pos += 1
                     if ch == '*':
                         if pat[pos:pos + 1] != '*':
                             # single star: anything within one path component
                             pieces.append('[^/]*')
                         else:
                             pos += 1
                             if pat[pos:pos + 1] == '/':
                                 # '**/': any number of leading directories
                                 pos += 1
                                 pieces.append('(?:.*/)?')
                             else:
                                 pieces.append('.*')
                     elif ch == '?':
                         pieces.append('.')
                     elif ch == '[':
                         close = pos
                         # a leading '!' or ']' belongs to the class itself
                         if close < end and pat[close:close + 1] in '!]':
                             close += 1
                         while close < end and pat[close:close + 1] != ']':
                             close += 1
                         if close >= end:
                             # unterminated class: treat '[' literally
                             pieces.append('\\[')
                         else:
                             members = pat[pos:close].replace('\\', '\\\\')
                             pos = close + 1
                             lead = members[0:1]
                             if lead == '!':
                                 members = '^' + members[1:]
                             elif lead == '^':
                                 members = '\\' + members
                             pieces.append('[%s]' % members)
                     elif ch == '{':
                         depth += 1
                         pieces.append('(?:')
                     elif ch == '}' and depth:
                         pieces.append(')')
                         depth -= 1
                     elif ch == ',' and depth:
                         pieces.append('|')
                     elif ch == '\\' and pat[pos:pos + 1]:
                         # a backslash escapes the character that follows it
                         pieces.append(escape(pat[pos:pos + 1]))
                         pos += 1
                     else:
                         # ordinary characters, plus '}' and ',' outside any group
                         # and a trailing backslash
                         pieces.append(escape(ch))
                 return ''.join(pieces)
             def _regex(kind, pat, globsuffix):
                 '''Convert a (normalized) pattern of any kind into a regular expression.
                 globsuffix is appended to the regexp of globs.'''
                 if not pat:
                     return ''
                 if kind == 're':
                     return pat
                 if kind in ('path', 'relpath'):
                     if pat == '.':
                         return ''
                     return util.re.escape(pat) + '(?:/|$)'
                 if kind == 'rootfilesin':
                     if pat == '.':
                         escaped = ''
                     else:
                         # Pattern is a directory name.
                         escaped = util.re.escape(pat) + '/'
                     # Anything after the pattern must be a non-directory.
                     return escaped + '[^/]+$'
                 if kind == 'relglob':
                     return '(?:|.*/)' + _globre(pat) + globsuffix
                 if kind == 'relre':
                     if pat.startswith('^'):
                         return pat
                     return '.*' + pat
                 return _globre(pat) + globsuffix
             def _buildmatch(ctx, kindpats, globsuffix, listsubrepos, root):
                 '''Return regexp string and a matcher function for kindpats.

                 globsuffix is appended to the regexp of globs. The returned function
                 accepts a file when any of the subinclude, fileset or regexp parts
                 accepts it.'''
                 candidates = []
                 subincludes, kindpats = _expandsubinclude(kindpats, root)
                 if subincludes:
                     # matchers for subincludes are built on first use, per prefix
                     cache = {}
                     def matchsubinclude(f):
                         for prefix, matcherargs in subincludes:
                             if not f.startswith(prefix):
                                 continue
                             submatch = cache.get(prefix)
                             if submatch is None:
                                 submatch = cache[prefix] = match(*matcherargs)
                             if submatch(f[len(prefix):]):
                                 return True
                         return False
                     candidates.append(matchsubinclude)
                 fset, kindpats = _expandsets(kindpats, ctx, listsubrepos)
                 if fset:
                     candidates.append(fset.__contains__)
                 regex = ''
                 if kindpats:
                     regex, regexmatch = _buildregexmatch(kindpats, globsuffix)
                     candidates.append(regexmatch)
                 if len(candidates) == 1:
                     return regex, candidates[0]
                 return regex, lambda f: any(fn(f) for fn in candidates)
             def _buildregexmatch(kindpats, globsuffix):
                 """Build a match function from a list of kinds and kindpats,
                 return regexp string and a matcher function.

                 Raises error.Abort when one of the patterns is not a valid regexp."""
                 try:
                     alternatives = [_regex(kind, pat, globsuffix)
                                     for (kind, pat, source) in kindpats]
                     regex = '(?:%s)' % '|'.join(alternatives)
                     if len(regex) > 20000:
                         raise OverflowError
                     return regex, _rematcher(regex)
                 except OverflowError:
                     # We're using a Python with a tiny regex engine and we
                     # made it explode, so we'll divide the pattern list in two
                     # until it works
                     count = len(kindpats)
                     if count < 2:
                         raise
                     half = count // 2
                     matchfirst = _buildregexmatch(kindpats[:half], globsuffix)[1]
                     matchsecond = _buildregexmatch(kindpats[half:], globsuffix)[1]
                     return regex, lambda s: matchfirst(s) or matchsecond(s)
                 except re.error:
                     # Recompile the patterns one by one to report the offending one.
                     for kind, pat, source in kindpats:
                         try:
                             _rematcher('(?:%s)' % _regex(kind, pat, globsuffix))
                         except re.error:
                             if source:
                                 raise error.Abort(_("%s: invalid pattern (%s): %s") %
                                                   (source, kind, pat))
                             raise error.Abort(_("invalid pattern (%s): %s") %
                                               (kind, pat))
                     raise error.Abort(_("invalid pattern"))
             def _patternrootsanddirs(kindpats):
                 '''Returns roots and directories corresponding to each pattern.
                 This calculates the roots and directories exactly matching the patterns and
                 returns a tuple of (roots, dirs) for each. It does not return other
                 directories which may also need to be considered, like the parent
                 directories.
                 '''
                 r = []
                 d = []
                 for kind, pat, source in kindpats:
                     if kind == 'glob': # find the non-glob prefix
                         root = []
                         for p in pat.split('/'):
                             if '[' in p or '{' in p or '*' in p or '?' in p:
                                 break
                             root.append(p)
                         r.append('/'.join(root) or '.')
                     elif kind in ('relpath', 'path'):
                         r.append(pat or '.')
                     elif kind in ('rootfilesin',):
                         d.append(pat or '.')
                     else: # relglob, re, relre
                         r.append('.')
                 return r, d
             def _roots(kindpats):
                 '''Returns root directories to match recursively from the given patterns.

                 Only the roots half of _patternrootsanddirs() is returned.'''
                 return _patternrootsanddirs(kindpats)[0]
             def _rootsanddirs(kindpats):
                 '''Returns roots and exact directories from patterns.

                 roots are directories to match recursively, whereas exact directories should
                 be matched non-recursively. The returned (roots, dirs) tuple will also
                 include directories that need to be implicitly considered as either, such as
                 parent directories.

                 >>> _rootsanddirs(
                 ...     [(b'glob', b'g/h/*', b''), (b'glob', b'g/h', b''),
                 ...      (b'glob', b'g*', b'')])
                 (['g/h', 'g/h', '.'], ['g', '.'])
                 >>> _rootsanddirs(
                 ...     [(b'rootfilesin', b'g/h', b''), (b'rootfilesin', b'', b'')])
                 ([], ['g/h', '.', 'g', '.'])
                 >>> _rootsanddirs(
                 ...     [(b'relpath', b'r', b''), (b'path', b'p/p', b''),
                 ...      (b'path', b'', b'')])
                 (['r', 'p/p', '.'], ['p', '.'])
                 >>> _rootsanddirs(
                 ...     [(b'relglob', b'rg*', b''), (b're', b're/', b''),
                 ...      (b'relre', b'rr', b'')])
                 (['.', '.', '.'], ['.'])
                 '''
                 roots, exactdirs = _patternrootsanddirs(kindpats)
                 # The parents must be scanned to reach either the roots or the other
                 # exact directories, so they are added as non-recursive directories.
                 dirparents = util.dirs(exactdirs)
                 exactdirs.extend(dirparents)
                 rootparents = util.dirs(roots)
                 exactdirs.extend(rootparents)
                 # util.dirs() does not include the root directory, so add it manually
                 exactdirs.append('.')
                 return roots, exactdirs
             def _explicitfiles(kindpats):
                 '''Returns the potential explicit filenames from the patterns.

                 >>> _explicitfiles([(b'path', b'foo/bar', b'')])
                 ['foo/bar']
                 >>> _explicitfiles([(b'rootfilesin', b'foo/bar', b'')])
                 []
                 '''
                 # 'rootfilesin' patterns can only name directories, so they are
                 # dropped before the roots are computed.
                 filable = [entry for entry in kindpats if entry[0] != 'rootfilesin']
                 return _roots(filable)
             def _prefix(kindpats):
                 '''Whether all the patterns match a prefix (i.e. recursively)'''
                 for kind, pat, source in kindpats:
                     if kind not in ('path', 'relpath'):
                         return False
                 return True
             _commentre = None

             def readpatternfile(filepath, warn, sourceinfo=False):
                 '''parse a pattern file, returning a list of
                 patterns. These patterns should be given to compile()
                 to be validated and converted into a match function.

                 trailing white space is dropped.
                 the escape character is backslash.
                 comments start with #.
                 empty lines are skipped.

                 lines can be of the following formats:

                 syntax: regexp # defaults following lines to non-rooted regexps
                 syntax: glob   # defaults following lines to non-rooted globs
                 re:pattern     # non-rooted regular expression
                 glob:pattern   # non-rooted glob
                 pattern        # pattern of the current default type

                 filepath is opened in binary mode. warn, when truthy, is called with a
                 message for every "syntax:" line naming an unknown syntax; such lines
                 are skipped either way.

                 if sourceinfo is set, returns a list of tuples:
                 (pattern, lineno, line), where line is the text left once comments,
                 trailing white space and any recognized syntax prefix were removed.
                 This is useful to debug ignore patterns.
                 '''
                 global _commentre
                 syntaxes = {'re': 'relre:', 'regexp': 'relre:', 'glob': 'relglob:',
                             'include': 'include', 'subinclude': 'subinclude'}
                 syntax = 'relre:'
                 patterns = []
                 # The with block closes the file even when parsing or warn() raises;
                 # a trailing fp.close() would be skipped in that case.
                 with open(filepath, 'rb') as fp:
                     for lineno, line in enumerate(util.iterfile(fp), start=1):
                         if "#" in line:
                             if not _commentre:
                                 # compiled on first use and cached at module level
                                 _commentre = util.re.compile(
                                     br'((?:^|[^\\])(?:\\\\)*)#.*')
                             # remove comments prefixed by an even number of escapes
                             m = _commentre.search(line)
                             if m:
                                 line = line[:m.end(1)]
                             # fixup properly escaped comments that survived the above
                             line = line.replace("\\#", "#")
                         line = line.rstrip()
                         if not line:
                             continue
                         if line.startswith('syntax:'):
                             s = line[7:].strip()
                             try:
                                 syntax = syntaxes[s]
                             except KeyError:
                                 if warn:
                                     warn(_("%s: ignoring invalid syntax '%s'\n") %
                                          (filepath, s))
                             continue
                         # A per-line prefix overrides the current default syntax.
                         linesyntax = syntax
                         for s, rels in syntaxes.items():
                             if line.startswith(rels):
                                 linesyntax = rels
                                 line = line[len(rels):]
                                 break
                             elif line.startswith(s+':'):
                                 linesyntax = rels
                                 line = line[len(s) + 1:]
                                 break
                         if sourceinfo:
                             patterns.append((linesyntax + line, lineno, line))
                         else:
                             patterns.append(linesyntax + line)
                 return patterns