##// END OF EJS Templates
branchmap: pytype is confused about bytestr...
Augie Fackler -
r43805:1a47fe4b default
parent child Browse files
Show More
@@ -1,732 +1,738
1 # branchmap.py - logic to computes, maintain and stores branchmap for local repo
1 # branchmap.py - logic to computes, maintain and stores branchmap for local repo
2 #
2 #
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from __future__ import absolute_import
8 from __future__ import absolute_import
9
9
10 import struct
10 import struct
11
11
12 from .node import (
12 from .node import (
13 bin,
13 bin,
14 hex,
14 hex,
15 nullid,
15 nullid,
16 nullrev,
16 nullrev,
17 )
17 )
18 from . import (
18 from . import (
19 encoding,
19 encoding,
20 error,
20 error,
21 pycompat,
21 pycompat,
22 scmutil,
22 scmutil,
23 util,
23 util,
24 )
24 )
25 from .utils import (
25 from .utils import (
26 repoviewutil,
26 repoviewutil,
27 stringutil,
27 stringutil,
28 )
28 )
29
29
30 subsettable = repoviewutil.subsettable
30 subsettable = repoviewutil.subsettable
31
31
32 calcsize = struct.calcsize
32 calcsize = struct.calcsize
33 pack_into = struct.pack_into
33 pack_into = struct.pack_into
34 unpack_from = struct.unpack_from
34 unpack_from = struct.unpack_from
35
35
36
36
class BranchMapCache(object):
    """mapping of filtered views of repo with their branchcache"""

    def __init__(self):
        # one branchcache instance per repoview filter name
        self._per_filter = {}

    def __getitem__(self, repo):
        # make sure the cached entry is fresh before handing it out
        self.updatecache(repo)
        return self._per_filter[repo.filtername]

    def updatecache(self, repo):
        """Update the cache for the given filtered view on a repository"""
        # This can trigger updates for the caches for subsets of the filtered
        # view, e.g. when there is no cache for this filtered view or the
        # cache is stale.

        cl = repo.changelog
        filtername = repo.filtername
        bcache = self._per_filter.get(filtername)
        if bcache is None or not bcache.validfor(repo):
            # cache object missing or cache object stale? Read from disk
            bcache = branchcache.fromfile(repo)

        revs = []
        if bcache is None:
            # no (fresh) cache available anymore, perhaps we can re-use
            # the cache for a subset, then extend that to add info on missing
            # revisions.
            subsetname = subsettable.get(filtername)
            if subsetname is None:
                # nothing to fall back on, start empty.
                bcache = branchcache()
            else:
                subset = repo.filtered(subsetname)
                bcache = self[subset].copy()
                extrarevs = subset.changelog.filteredrevs - cl.filteredrevs
                revs.extend(r for r in extrarevs if r <= bcache.tiprev)

        revs.extend(cl.revs(start=bcache.tiprev + 1))
        if revs:
            bcache.update(repo, revs)

        assert bcache.validfor(repo), filtername
        self._per_filter[repo.filtername] = bcache

    def replace(self, repo, remotebranchmap):
        """Replace the branchmap cache for a repo with a branch mapping.

        This is likely only called during clone with a branch map from a
        remote.
        """
        cl = repo.changelog
        clrev = cl.rev
        clbranchinfo = cl.branchinfo
        rbheads = []
        closed = []
        for bheads in pycompat.itervalues(remotebranchmap):
            rbheads += bheads
            for h in bheads:
                r = clrev(h)
                b, c = clbranchinfo(r)
                if c:
                    closed.append(h)

        if rbheads:
            rtiprev = max((int(clrev(node)) for node in rbheads))
            cache = branchcache(
                remotebranchmap,
                repo[rtiprev].node(),
                rtiprev,
                closednodes=closed,
            )

            # Try to stick it as low as possible
            # filter above served are unlikely to be fetch from a clone
            for candidate in (b'base', b'immutable', b'served'):
                rview = repo.filtered(candidate)
                if cache.validfor(rview):
                    self._per_filter[candidate] = cache
                    cache.write(rview)
                    return

    def clear(self):
        # drop every per-filter cache entry
        self._per_filter.clear()
122
122
123
123
def _unknownnode(node):
    """raises ValueError when branchcache found a node which does not exists
    """
    raise ValueError(r'node %s does not exist' % pycompat.sysstr(hex(node)))
128
128
129
129
130 def _branchcachedesc(repo):
130 def _branchcachedesc(repo):
131 if repo.filtername is not None:
131 if repo.filtername is not None:
132 return b'branch cache (%s)' % repo.filtername
132 return b'branch cache (%s)' % repo.filtername
133 else:
133 else:
134 return b'branch cache'
134 return b'branch cache'
135
135
136
136
class branchcache(object):
    """A dict like object that hold branches heads cache.

    This cache is used to avoid costly computations to determine all the
    branch heads of a repo.

    The cache is serialized on disk in the following format:

    <tip hex node> <tip rev number> [optional filtered repo hex hash]
    <branch head hex node> <open/closed state> <branch name>
    <branch head hex node> <open/closed state> <branch name>
    ...

    The first line is used to check if the cache is still valid. If the
    branch cache is for a filtered repo view, an optional third hash is
    included that hashes the hashes of all filtered revisions.

    The open/closed state is represented by a single letter 'o' or 'c'.
    This field can be used to avoid changelog reads when determining if a
    branch head closes a branch or not.
    """

    def __init__(
        self,
        entries=(),
        tipnode=nullid,
        tiprev=nullrev,
        filteredhash=None,
        closednodes=None,
        hasnode=None,
    ):
        """ hasnode is a function which can be used to verify whether changelog
        has a given node or not. If it's not provided, we assume that every node
        we have exists in changelog """
        self.tipnode = tipnode
        self.tiprev = tiprev
        self.filteredhash = filteredhash
        # closednodes is a set of nodes that close their branch. If the branch
        # cache has been updated, it may contain nodes that are no longer
        # heads.
        self._closednodes = set() if closednodes is None else closednodes
        self._entries = dict(entries)
        # whether closed nodes are verified or not
        self._closedverified = False
        # branches for which nodes are verified
        self._verifiedbranches = set()
        # assume every node exists when no verification callback is given
        self._hasnode = hasnode if hasnode is not None else (lambda x: True)

    def _verifyclosed(self):
        """ verify the closed nodes we have """
        if self._closedverified:
            return
        for node in self._closednodes:
            if not self._hasnode(node):
                _unknownnode(node)

        self._closedverified = True

    def _verifybranch(self, branch):
        """ verify head nodes for the given branch. """
        if branch not in self._entries or branch in self._verifiedbranches:
            return
        for n in self._entries[branch]:
            if not self._hasnode(n):
                _unknownnode(n)

        self._verifiedbranches.add(branch)

    def _verifyall(self):
        """ verifies nodes of all the branches """
        for b in set(self._entries.keys()) - self._verifiedbranches:
            self._verifybranch(b)

    def __iter__(self):
        return iter(self._entries)

    def __setitem__(self, key, value):
        self._entries[key] = value

    def __getitem__(self, key):
        self._verifybranch(key)
        return self._entries[key]

    def __contains__(self, key):
        self._verifybranch(key)
        return key in self._entries

    def iteritems(self):
        # verify each branch lazily as it is yielded
        for k, v in pycompat.iteritems(self._entries):
            self._verifybranch(k)
            yield k, v

    items = iteritems

    def hasbranch(self, label):
        """ checks whether a branch of this name exists or not """
        self._verifybranch(label)
        return label in self._entries

    @classmethod
    def fromfile(cls, repo):
        # Returns a branchcache loaded from the on-disk cache file, or None
        # when the file is missing/unreadable or its content is invalid.
        f = None
        try:
            f = repo.cachevfs(cls._filename(repo))
            lineiter = iter(f)
            cachekey = next(lineiter).rstrip(b'\n').split(b" ", 2)
            last, lrev = cachekey[:2]
            last, lrev = bin(last), int(lrev)
            filteredhash = None
            hasnode = repo.changelog.hasnode
            if len(cachekey) > 2:
                filteredhash = bin(cachekey[2])
            bcache = cls(
                tipnode=last,
                tiprev=lrev,
                filteredhash=filteredhash,
                hasnode=hasnode,
            )
            if not bcache.validfor(repo):
                # invalidate the cache
                raise ValueError(r'tip differs')
            bcache.load(repo, lineiter)
        except (IOError, OSError):
            return None

        except Exception as inst:
            if repo.ui.debugflag:
                msg = b'invalid %s: %s\n'
                repo.ui.debug(
                    msg
                    % (
                        _branchcachedesc(repo),
                        pycompat.bytestr(
                            inst  # pytype: disable=wrong-arg-types
                        ),
                    )
                )
            bcache = None

        finally:
            if f:
                f.close()

        return bcache

    def load(self, repo, lineiter):
        """ fully loads the branchcache by reading from the file using the line
        iterator passed"""
        for line in lineiter:
            line = line.rstrip(b'\n')
            if not line:
                continue
            node, state, label = line.split(b" ", 2)
            if state not in b'oc':
                raise ValueError(r'invalid branch state')
            label = encoding.tolocal(label.strip())
            node = bin(node)
            self._entries.setdefault(label, []).append(node)
            if state == b'c':
                self._closednodes.add(node)

    @staticmethod
    def _filename(repo):
        """name of a branchcache file for a given repo or repoview"""
        filename = b"branch2"
        if repo.filtername:
            filename = b'%s-%s' % (filename, repo.filtername)
        return filename

    def validfor(self, repo):
        """Is the cache content valid regarding a repo

        - False when cached tipnode is unknown or if we detect a strip.
        - True when cache is up to date or a subset of current repo."""
        try:
            return (self.tipnode == repo.changelog.node(self.tiprev)) and (
                self.filteredhash == scmutil.filteredhash(repo, self.tiprev)
            )
        except IndexError:
            return False

    def _branchtip(self, heads):
        '''Return tuple with last open head in heads and false,
        otherwise return last closed head and true.'''
        tip = heads[-1]
        closed = True
        for h in reversed(heads):
            if h not in self._closednodes:
                tip = h
                closed = False
                break
        return tip, closed

    def branchtip(self, branch):
        '''Return the tipmost open head on branch head, otherwise return the
        tipmost closed head on branch.
        Raise KeyError for unknown branch.'''
        return self._branchtip(self[branch])[0]

    def iteropen(self, nodes):
        # lazily filter out heads whose node closes its branch
        return (n for n in nodes if n not in self._closednodes)

    def branchheads(self, branch, closed=False):
        self._verifybranch(branch)
        heads = self._entries[branch]
        if not closed:
            heads = list(self.iteropen(heads))
        return heads

    def iterbranches(self):
        for bn, heads in pycompat.iteritems(self):
            yield (bn, heads) + self._branchtip(heads)

    def iterheads(self):
        """ returns all the heads """
        self._verifyall()
        return pycompat.itervalues(self._entries)

    def copy(self):
        """return an deep copy of the branchcache object"""
        return type(self)(
            self._entries,
            self.tipnode,
            self.tiprev,
            self.filteredhash,
            self._closednodes,
        )

    def write(self, repo):
        try:
            f = repo.cachevfs(self._filename(repo), b"w", atomictemp=True)
            cachekey = [hex(self.tipnode), b'%d' % self.tiprev]
            if self.filteredhash is not None:
                cachekey.append(hex(self.filteredhash))
            f.write(b" ".join(cachekey) + b'\n')
            nodecount = 0
            for label, nodes in sorted(pycompat.iteritems(self._entries)):
                label = encoding.fromlocal(label)
                for node in nodes:
                    nodecount += 1
                    state = b'c' if node in self._closednodes else b'o'
                    f.write(b"%s %s %s\n" % (hex(node), state, label))
            f.close()
            repo.ui.log(
                b'branchcache',
                b'wrote %s with %d labels and %d nodes\n',
                _branchcachedesc(repo),
                len(self._entries),
                nodecount,
            )
        except (IOError, OSError, error.Abort) as inst:
            # Abort may be raised by read only opener, so log and continue
            repo.ui.debug(
                b"couldn't write branch cache: %s\n"
                % stringutil.forcebytestr(inst)
            )

    def update(self, repo, revgen):
        """Given a branchhead cache, self, that may have extra nodes or be
        missing heads, and a generator of nodes that are strictly a superset of
        heads missing, this function updates self to be correct.
        """
        starttime = util.timer()
        cl = repo.changelog
        # collect new branch entries
        newbranches = {}
        getbranchinfo = repo.revbranchcache().branchinfo
        for r in revgen:
            branch, closesbranch = getbranchinfo(r)
            newbranches.setdefault(branch, []).append(r)
            if closesbranch:
                self._closednodes.add(cl.node(r))

        # fetch current topological heads to speed up filtering
        topoheads = set(cl.headrevs())

        # new tip revision which we found after iterating items from new
        # branches
        ntiprev = self.tiprev

        # if older branchheads are reachable from new ones, they aren't
        # really branchheads. Note checking parents is insufficient:
        # 1 (branch a) -> 2 (branch b) -> 3 (branch a)
        for branch, newheadrevs in pycompat.iteritems(newbranches):
            bheads = self._entries.setdefault(branch, [])
            bheadset = set(cl.rev(node) for node in bheads)

            # This have been tested True on all internal usage of this function.
            # run it again in case of doubt
            # assert not (set(bheadrevs) & set(newheadrevs))
            bheadset.update(newheadrevs)

            # This prunes out two kinds of heads - heads that are superseded by
            # a head in newheadrevs, and newheadrevs that are not heads because
            # an existing head is their descendant.
            uncertain = bheadset - topoheads
            if uncertain:
                floorrev = min(uncertain)
                ancestors = set(cl.ancestors(newheadrevs, floorrev))
                bheadset -= ancestors
            bheadrevs = sorted(bheadset)
            self[branch] = [cl.node(rev) for rev in bheadrevs]
            tiprev = bheadrevs[-1]
            if tiprev > ntiprev:
                ntiprev = tiprev

        if ntiprev > self.tiprev:
            self.tiprev = ntiprev
            self.tipnode = cl.node(ntiprev)

        if not self.validfor(repo):
            # cache key are not valid anymore
            self.tipnode = nullid
            self.tiprev = nullrev
            for heads in self.iterheads():
                tiprev = max(cl.rev(node) for node in heads)
                if tiprev > self.tiprev:
                    self.tipnode = cl.node(tiprev)
                    self.tiprev = tiprev
        self.filteredhash = scmutil.filteredhash(repo, self.tiprev)

        duration = util.timer() - starttime
        repo.ui.log(
            b'branchcache',
            b'updated %s in %.4f seconds\n',
            _branchcachedesc(repo),
            duration,
        )

        self.write(repo)
470
476
471
477
class remotebranchcache(branchcache):
    """Branchmap info for a remote connection, should not write locally"""

    def write(self, repo):
        # intentionally a no-op: data describing a remote repository must
        # never be persisted into the local cache files
        pass
477
483
478
484
479 # Revision branch info cache
485 # Revision branch info cache
480
486
481 _rbcversion = b'-v1'
487 _rbcversion = b'-v1'
482 _rbcnames = b'rbc-names' + _rbcversion
488 _rbcnames = b'rbc-names' + _rbcversion
483 _rbcrevs = b'rbc-revs' + _rbcversion
489 _rbcrevs = b'rbc-revs' + _rbcversion
484 # [4 byte hash prefix][4 byte branch name number with sign bit indicating open]
490 # [4 byte hash prefix][4 byte branch name number with sign bit indicating open]
485 _rbcrecfmt = b'>4sI'
491 _rbcrecfmt = b'>4sI'
486 _rbcrecsize = calcsize(_rbcrecfmt)
492 _rbcrecsize = calcsize(_rbcrecfmt)
487 _rbcnodelen = 4
493 _rbcnodelen = 4
488 _rbcbranchidxmask = 0x7FFFFFFF
494 _rbcbranchidxmask = 0x7FFFFFFF
489 _rbccloseflag = 0x80000000
495 _rbccloseflag = 0x80000000
490
496
491
497
492 class revbranchcache(object):
498 class revbranchcache(object):
493 """Persistent cache, mapping from revision number to branch name and close.
499 """Persistent cache, mapping from revision number to branch name and close.
494 This is a low level cache, independent of filtering.
500 This is a low level cache, independent of filtering.
495
501
496 Branch names are stored in rbc-names in internal encoding separated by 0.
502 Branch names are stored in rbc-names in internal encoding separated by 0.
497 rbc-names is append-only, and each branch name is only stored once and will
503 rbc-names is append-only, and each branch name is only stored once and will
498 thus have a unique index.
504 thus have a unique index.
499
505
500 The branch info for each revision is stored in rbc-revs as constant size
506 The branch info for each revision is stored in rbc-revs as constant size
501 records. The whole file is read into memory, but it is only 'parsed' on
507 records. The whole file is read into memory, but it is only 'parsed' on
502 demand. The file is usually append-only but will be truncated if repo
508 demand. The file is usually append-only but will be truncated if repo
503 modification is detected.
509 modification is detected.
504 The record for each revision contains the first 4 bytes of the
510 The record for each revision contains the first 4 bytes of the
505 corresponding node hash, and the record is only used if it still matches.
511 corresponding node hash, and the record is only used if it still matches.
506 Even a completely trashed rbc-revs fill thus still give the right result
512 Even a completely trashed rbc-revs fill thus still give the right result
507 while converging towards full recovery ... assuming no incorrectly matching
513 while converging towards full recovery ... assuming no incorrectly matching
508 node hashes.
514 node hashes.
509 The record also contains 4 bytes where 31 bits contains the index of the
515 The record also contains 4 bytes where 31 bits contains the index of the
510 branch and the last bit indicate that it is a branch close commit.
516 branch and the last bit indicate that it is a branch close commit.
511 The usage pattern for rbc-revs is thus somewhat similar to 00changelog.i
517 The usage pattern for rbc-revs is thus somewhat similar to 00changelog.i
512 and will grow with it but be 1/8th of its size.
518 and will grow with it but be 1/8th of its size.
513 """
519 """
514
520
515 def __init__(self, repo, readonly=True):
521 def __init__(self, repo, readonly=True):
516 assert repo.filtername is None
522 assert repo.filtername is None
517 self._repo = repo
523 self._repo = repo
518 self._names = [] # branch names in local encoding with static index
524 self._names = [] # branch names in local encoding with static index
519 self._rbcrevs = bytearray()
525 self._rbcrevs = bytearray()
520 self._rbcsnameslen = 0 # length of names read at _rbcsnameslen
526 self._rbcsnameslen = 0 # length of names read at _rbcsnameslen
521 try:
527 try:
522 bndata = repo.cachevfs.read(_rbcnames)
528 bndata = repo.cachevfs.read(_rbcnames)
523 self._rbcsnameslen = len(bndata) # for verification before writing
529 self._rbcsnameslen = len(bndata) # for verification before writing
524 if bndata:
530 if bndata:
525 self._names = [
531 self._names = [
526 encoding.tolocal(bn) for bn in bndata.split(b'\0')
532 encoding.tolocal(bn) for bn in bndata.split(b'\0')
527 ]
533 ]
528 except (IOError, OSError):
534 except (IOError, OSError):
529 if readonly:
535 if readonly:
530 # don't try to use cache - fall back to the slow path
536 # don't try to use cache - fall back to the slow path
531 self.branchinfo = self._branchinfo
537 self.branchinfo = self._branchinfo
532
538
533 if self._names:
539 if self._names:
534 try:
540 try:
535 data = repo.cachevfs.read(_rbcrevs)
541 data = repo.cachevfs.read(_rbcrevs)
536 self._rbcrevs[:] = data
542 self._rbcrevs[:] = data
537 except (IOError, OSError) as inst:
543 except (IOError, OSError) as inst:
538 repo.ui.debug(
544 repo.ui.debug(
539 b"couldn't read revision branch cache: %s\n"
545 b"couldn't read revision branch cache: %s\n"
540 % stringutil.forcebytestr(inst)
546 % stringutil.forcebytestr(inst)
541 )
547 )
542 # remember number of good records on disk
548 # remember number of good records on disk
543 self._rbcrevslen = min(
549 self._rbcrevslen = min(
544 len(self._rbcrevs) // _rbcrecsize, len(repo.changelog)
550 len(self._rbcrevs) // _rbcrecsize, len(repo.changelog)
545 )
551 )
546 if self._rbcrevslen == 0:
552 if self._rbcrevslen == 0:
547 self._names = []
553 self._names = []
548 self._rbcnamescount = len(self._names) # number of names read at
554 self._rbcnamescount = len(self._names) # number of names read at
549 # _rbcsnameslen
555 # _rbcsnameslen
550
556
551 def _clear(self):
557 def _clear(self):
552 self._rbcsnameslen = 0
558 self._rbcsnameslen = 0
553 del self._names[:]
559 del self._names[:]
554 self._rbcnamescount = 0
560 self._rbcnamescount = 0
555 self._rbcrevslen = len(self._repo.changelog)
561 self._rbcrevslen = len(self._repo.changelog)
556 self._rbcrevs = bytearray(self._rbcrevslen * _rbcrecsize)
562 self._rbcrevs = bytearray(self._rbcrevslen * _rbcrecsize)
557 util.clearcachedproperty(self, b'_namesreverse')
563 util.clearcachedproperty(self, b'_namesreverse')
558
564
559 @util.propertycache
565 @util.propertycache
560 def _namesreverse(self):
566 def _namesreverse(self):
561 return dict((b, r) for r, b in enumerate(self._names))
567 return dict((b, r) for r, b in enumerate(self._names))
562
568
563 def branchinfo(self, rev):
569 def branchinfo(self, rev):
564 """Return branch name and close flag for rev, using and updating
570 """Return branch name and close flag for rev, using and updating
565 persistent cache."""
571 persistent cache."""
566 changelog = self._repo.changelog
572 changelog = self._repo.changelog
567 rbcrevidx = rev * _rbcrecsize
573 rbcrevidx = rev * _rbcrecsize
568
574
569 # avoid negative index, changelog.read(nullrev) is fast without cache
575 # avoid negative index, changelog.read(nullrev) is fast without cache
570 if rev == nullrev:
576 if rev == nullrev:
571 return changelog.branchinfo(rev)
577 return changelog.branchinfo(rev)
572
578
573 # if requested rev isn't allocated, grow and cache the rev info
579 # if requested rev isn't allocated, grow and cache the rev info
574 if len(self._rbcrevs) < rbcrevidx + _rbcrecsize:
580 if len(self._rbcrevs) < rbcrevidx + _rbcrecsize:
575 return self._branchinfo(rev)
581 return self._branchinfo(rev)
576
582
577 # fast path: extract data from cache, use it if node is matching
583 # fast path: extract data from cache, use it if node is matching
578 reponode = changelog.node(rev)[:_rbcnodelen]
584 reponode = changelog.node(rev)[:_rbcnodelen]
579 cachenode, branchidx = unpack_from(
585 cachenode, branchidx = unpack_from(
580 _rbcrecfmt, util.buffer(self._rbcrevs), rbcrevidx
586 _rbcrecfmt, util.buffer(self._rbcrevs), rbcrevidx
581 )
587 )
582 close = bool(branchidx & _rbccloseflag)
588 close = bool(branchidx & _rbccloseflag)
583 if close:
589 if close:
584 branchidx &= _rbcbranchidxmask
590 branchidx &= _rbcbranchidxmask
585 if cachenode == b'\0\0\0\0':
591 if cachenode == b'\0\0\0\0':
586 pass
592 pass
587 elif cachenode == reponode:
593 elif cachenode == reponode:
588 try:
594 try:
589 return self._names[branchidx], close
595 return self._names[branchidx], close
590 except IndexError:
596 except IndexError:
591 # recover from invalid reference to unknown branch
597 # recover from invalid reference to unknown branch
592 self._repo.ui.debug(
598 self._repo.ui.debug(
593 b"referenced branch names not found"
599 b"referenced branch names not found"
594 b" - rebuilding revision branch cache from scratch\n"
600 b" - rebuilding revision branch cache from scratch\n"
595 )
601 )
596 self._clear()
602 self._clear()
597 else:
603 else:
598 # rev/node map has changed, invalidate the cache from here up
604 # rev/node map has changed, invalidate the cache from here up
599 self._repo.ui.debug(
605 self._repo.ui.debug(
600 b"history modification detected - truncating "
606 b"history modification detected - truncating "
601 b"revision branch cache to revision %d\n" % rev
607 b"revision branch cache to revision %d\n" % rev
602 )
608 )
603 truncate = rbcrevidx + _rbcrecsize
609 truncate = rbcrevidx + _rbcrecsize
604 del self._rbcrevs[truncate:]
610 del self._rbcrevs[truncate:]
605 self._rbcrevslen = min(self._rbcrevslen, truncate)
611 self._rbcrevslen = min(self._rbcrevslen, truncate)
606
612
607 # fall back to slow path and make sure it will be written to disk
613 # fall back to slow path and make sure it will be written to disk
608 return self._branchinfo(rev)
614 return self._branchinfo(rev)
609
615
610 def _branchinfo(self, rev):
616 def _branchinfo(self, rev):
611 """Retrieve branch info from changelog and update _rbcrevs"""
617 """Retrieve branch info from changelog and update _rbcrevs"""
612 changelog = self._repo.changelog
618 changelog = self._repo.changelog
613 b, close = changelog.branchinfo(rev)
619 b, close = changelog.branchinfo(rev)
614 if b in self._namesreverse:
620 if b in self._namesreverse:
615 branchidx = self._namesreverse[b]
621 branchidx = self._namesreverse[b]
616 else:
622 else:
617 branchidx = len(self._names)
623 branchidx = len(self._names)
618 self._names.append(b)
624 self._names.append(b)
619 self._namesreverse[b] = branchidx
625 self._namesreverse[b] = branchidx
620 reponode = changelog.node(rev)
626 reponode = changelog.node(rev)
621 if close:
627 if close:
622 branchidx |= _rbccloseflag
628 branchidx |= _rbccloseflag
623 self._setcachedata(rev, reponode, branchidx)
629 self._setcachedata(rev, reponode, branchidx)
624 return b, close
630 return b, close
625
631
626 def setdata(self, branch, rev, node, close):
632 def setdata(self, branch, rev, node, close):
627 """add new data information to the cache"""
633 """add new data information to the cache"""
628 if branch in self._namesreverse:
634 if branch in self._namesreverse:
629 branchidx = self._namesreverse[branch]
635 branchidx = self._namesreverse[branch]
630 else:
636 else:
631 branchidx = len(self._names)
637 branchidx = len(self._names)
632 self._names.append(branch)
638 self._names.append(branch)
633 self._namesreverse[branch] = branchidx
639 self._namesreverse[branch] = branchidx
634 if close:
640 if close:
635 branchidx |= _rbccloseflag
641 branchidx |= _rbccloseflag
636 self._setcachedata(rev, node, branchidx)
642 self._setcachedata(rev, node, branchidx)
637 # If no cache data were readable (non exists, bad permission, etc)
643 # If no cache data were readable (non exists, bad permission, etc)
638 # the cache was bypassing itself by setting:
644 # the cache was bypassing itself by setting:
639 #
645 #
640 # self.branchinfo = self._branchinfo
646 # self.branchinfo = self._branchinfo
641 #
647 #
642 # Since we now have data in the cache, we need to drop this bypassing.
648 # Since we now have data in the cache, we need to drop this bypassing.
643 if r'branchinfo' in vars(self):
649 if r'branchinfo' in vars(self):
644 del self.branchinfo
650 del self.branchinfo
645
651
646 def _setcachedata(self, rev, node, branchidx):
652 def _setcachedata(self, rev, node, branchidx):
647 """Writes the node's branch data to the in-memory cache data."""
653 """Writes the node's branch data to the in-memory cache data."""
648 if rev == nullrev:
654 if rev == nullrev:
649 return
655 return
650 rbcrevidx = rev * _rbcrecsize
656 rbcrevidx = rev * _rbcrecsize
651 if len(self._rbcrevs) < rbcrevidx + _rbcrecsize:
657 if len(self._rbcrevs) < rbcrevidx + _rbcrecsize:
652 self._rbcrevs.extend(
658 self._rbcrevs.extend(
653 b'\0'
659 b'\0'
654 * (len(self._repo.changelog) * _rbcrecsize - len(self._rbcrevs))
660 * (len(self._repo.changelog) * _rbcrecsize - len(self._rbcrevs))
655 )
661 )
656 pack_into(_rbcrecfmt, self._rbcrevs, rbcrevidx, node, branchidx)
662 pack_into(_rbcrecfmt, self._rbcrevs, rbcrevidx, node, branchidx)
657 self._rbcrevslen = min(self._rbcrevslen, rev)
663 self._rbcrevslen = min(self._rbcrevslen, rev)
658
664
659 tr = self._repo.currenttransaction()
665 tr = self._repo.currenttransaction()
660 if tr:
666 if tr:
661 tr.addfinalize(b'write-revbranchcache', self.write)
667 tr.addfinalize(b'write-revbranchcache', self.write)
662
668
663 def write(self, tr=None):
669 def write(self, tr=None):
664 """Save branch cache if it is dirty."""
670 """Save branch cache if it is dirty."""
665 repo = self._repo
671 repo = self._repo
666 wlock = None
672 wlock = None
667 step = b''
673 step = b''
668 try:
674 try:
669 # write the new names
675 # write the new names
670 if self._rbcnamescount < len(self._names):
676 if self._rbcnamescount < len(self._names):
671 wlock = repo.wlock(wait=False)
677 wlock = repo.wlock(wait=False)
672 step = b' names'
678 step = b' names'
673 self._writenames(repo)
679 self._writenames(repo)
674
680
675 # write the new revs
681 # write the new revs
676 start = self._rbcrevslen * _rbcrecsize
682 start = self._rbcrevslen * _rbcrecsize
677 if start != len(self._rbcrevs):
683 if start != len(self._rbcrevs):
678 step = b''
684 step = b''
679 if wlock is None:
685 if wlock is None:
680 wlock = repo.wlock(wait=False)
686 wlock = repo.wlock(wait=False)
681 self._writerevs(repo, start)
687 self._writerevs(repo, start)
682
688
683 except (IOError, OSError, error.Abort, error.LockError) as inst:
689 except (IOError, OSError, error.Abort, error.LockError) as inst:
684 repo.ui.debug(
690 repo.ui.debug(
685 b"couldn't write revision branch cache%s: %s\n"
691 b"couldn't write revision branch cache%s: %s\n"
686 % (step, stringutil.forcebytestr(inst))
692 % (step, stringutil.forcebytestr(inst))
687 )
693 )
688 finally:
694 finally:
689 if wlock is not None:
695 if wlock is not None:
690 wlock.release()
696 wlock.release()
691
697
692 def _writenames(self, repo):
698 def _writenames(self, repo):
693 """ write the new branch names to revbranchcache """
699 """ write the new branch names to revbranchcache """
694 if self._rbcnamescount != 0:
700 if self._rbcnamescount != 0:
695 f = repo.cachevfs.open(_rbcnames, b'ab')
701 f = repo.cachevfs.open(_rbcnames, b'ab')
696 if f.tell() == self._rbcsnameslen:
702 if f.tell() == self._rbcsnameslen:
697 f.write(b'\0')
703 f.write(b'\0')
698 else:
704 else:
699 f.close()
705 f.close()
700 repo.ui.debug(b"%s changed - rewriting it\n" % _rbcnames)
706 repo.ui.debug(b"%s changed - rewriting it\n" % _rbcnames)
701 self._rbcnamescount = 0
707 self._rbcnamescount = 0
702 self._rbcrevslen = 0
708 self._rbcrevslen = 0
703 if self._rbcnamescount == 0:
709 if self._rbcnamescount == 0:
704 # before rewriting names, make sure references are removed
710 # before rewriting names, make sure references are removed
705 repo.cachevfs.unlinkpath(_rbcrevs, ignoremissing=True)
711 repo.cachevfs.unlinkpath(_rbcrevs, ignoremissing=True)
706 f = repo.cachevfs.open(_rbcnames, b'wb')
712 f = repo.cachevfs.open(_rbcnames, b'wb')
707 f.write(
713 f.write(
708 b'\0'.join(
714 b'\0'.join(
709 encoding.fromlocal(b)
715 encoding.fromlocal(b)
710 for b in self._names[self._rbcnamescount :]
716 for b in self._names[self._rbcnamescount :]
711 )
717 )
712 )
718 )
713 self._rbcsnameslen = f.tell()
719 self._rbcsnameslen = f.tell()
714 f.close()
720 f.close()
715 self._rbcnamescount = len(self._names)
721 self._rbcnamescount = len(self._names)
716
722
717 def _writerevs(self, repo, start):
723 def _writerevs(self, repo, start):
718 """ write the new revs to revbranchcache """
724 """ write the new revs to revbranchcache """
719 revs = min(len(repo.changelog), len(self._rbcrevs) // _rbcrecsize)
725 revs = min(len(repo.changelog), len(self._rbcrevs) // _rbcrecsize)
720 with repo.cachevfs.open(_rbcrevs, b'ab') as f:
726 with repo.cachevfs.open(_rbcrevs, b'ab') as f:
721 if f.tell() != start:
727 if f.tell() != start:
722 repo.ui.debug(
728 repo.ui.debug(
723 b"truncating cache/%s to %d\n" % (_rbcrevs, start)
729 b"truncating cache/%s to %d\n" % (_rbcrevs, start)
724 )
730 )
725 f.seek(start)
731 f.seek(start)
726 if f.tell() != start:
732 if f.tell() != start:
727 start = 0
733 start = 0
728 f.seek(start)
734 f.seek(start)
729 f.truncate()
735 f.truncate()
730 end = revs * _rbcrecsize
736 end = revs * _rbcrecsize
731 f.write(self._rbcrevs[start:end])
737 f.write(self._rbcrevs[start:end])
732 self._rbcrevslen = revs
738 self._rbcrevslen = revs
General Comments 0
You need to be logged in to leave comments. Login now