@@ -1,513 +1,519 b''
# nodemap.py - nodemap related code and utilities
#
# Copyright 2019 Pierre-Yves David <pierre-yves.david@octobus.net>
# Copyright 2019 George Racinet <georges.racinet@octobus.net>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

from __future__ import absolute_import

import os
import re
import struct

from .. import (
    error,
    node as nodemod,
    util,
)


class NodeMap(dict):
    def __missing__(self, x):
        raise error.RevlogError(b'unknown node: %s' % x)


def persisted_data(revlog):
    """read the nodemap for a revlog from disk"""
    if revlog.nodemap_file is None:
        return None
    pdata = revlog.opener.tryread(revlog.nodemap_file)
    if not pdata:
        return None
    offset = 0
    (version,) = S_VERSION.unpack(pdata[offset : offset + S_VERSION.size])
    if version != ONDISK_VERSION:
        return None
    offset += S_VERSION.size
    headers = S_HEADER.unpack(pdata[offset : offset + S_HEADER.size])
    uid_size, tip_rev, data_length, data_unused = headers
    offset += S_HEADER.size
    docket = NodeMapDocket(pdata[offset : offset + uid_size])
    docket.tip_rev = tip_rev
    docket.data_length = data_length
    docket.data_unused = data_unused

    filename = _rawdata_filepath(revlog, docket)
    data = revlog.opener.tryread(filename)
    if len(data) < data_length:
        return None
    elif len(data) > data_length:
        data = data[:data_length]
    return docket, data


def setup_persistent_nodemap(tr, revlog):
    """Install whatever is needed transaction side to persist a nodemap on disk

    (only actually persist the nodemap if this is relevant for this revlog)
    """
    if revlog._inline:
        return  # inlined revlogs are too small for this to be relevant
    if revlog.nodemap_file is None:
        return  # we do not use persistent_nodemap on this revlog
    callback_id = b"revlog-persistent-nodemap-%s" % revlog.nodemap_file
    if tr.hasfinalize(callback_id):
        return  # no need to register again
    tr.addfinalize(callback_id, lambda tr: _persist_nodemap(tr, revlog))


def _persist_nodemap(tr, revlog):
    """Write nodemap data on disk for a given revlog
    """
    if getattr(revlog, 'filteredrevs', ()):
        raise error.ProgrammingError(
            "cannot persist nodemap of a filtered changelog"
        )
    if revlog.nodemap_file is None:
        msg = "calling persist nodemap on a revlog without the feature enabled"
        raise error.ProgrammingError(msg)

    can_incremental = util.safehasattr(revlog.index, "nodemap_data_incremental")
    ondisk_docket = revlog._nodemap_docket

    data = None
    # first attempt an incremental update of the data
    if can_incremental and ondisk_docket is not None:
        target_docket = revlog._nodemap_docket.copy()
        (
            src_docket,
            data_changed_count,
            data,
        ) = revlog.index.nodemap_data_incremental()
        if src_docket != target_docket:
            data = None
        else:
            datafile = _rawdata_filepath(revlog, target_docket)
            # EXP-TODO: if this is a cache, this should use a cache vfs, not a
            # store vfs
            with revlog.opener(datafile, b'r+') as fd:
                fd.seek(target_docket.data_length)
                fd.write(data)
+                fd.seek(0)
+                new_data = fd.read(target_docket.data_length + len(data))
            target_docket.data_length += len(data)
            target_docket.data_unused += data_changed_count

    if data is None:
        # otherwise fallback to a full new export
        target_docket = NodeMapDocket()
        datafile = _rawdata_filepath(revlog, target_docket)
        if util.safehasattr(revlog.index, "nodemap_data_all"):
            data = revlog.index.nodemap_data_all()
        else:
            data = persistent_data(revlog.index)
        # EXP-TODO: if this is a cache, this should use a cache vfs, not a
        # store vfs
+        new_data = data
        with revlog.opener(datafile, b'w') as fd:
            fd.write(data)
        target_docket.data_length = len(data)
    target_docket.tip_rev = revlog.tiprev()
    # EXP-TODO: if this is a cache, this should use a cache vfs, not a
    # store vfs
    with revlog.opener(revlog.nodemap_file, b'w', atomictemp=True) as fp:
        fp.write(target_docket.serialize())
    revlog._nodemap_docket = target_docket
+    if util.safehasattr(revlog.index, "update_nodemap_data"):
+        revlog.index.update_nodemap_data(target_docket, new_data)
+
    # EXP-TODO: if the transaction aborts, we should remove the new data and
    # reinstall the old one.

    # search for old index file in all cases, some older process might have
    # left one behind.
    olds = _other_rawdata_filepath(revlog, target_docket)
    if olds:
        realvfs = getattr(revlog, '_realopener', revlog.opener)

        def cleanup(tr):
            for oldfile in olds:
                realvfs.tryunlink(oldfile)

        callback_id = b"revlog-cleanup-nodemap-%s" % revlog.nodemap_file
        tr.addpostclose(callback_id, cleanup)


### Nodemap docket file
#
# The nodemap data are stored on disk using 2 files:
#
# * a raw data file containing a persistent nodemap
#   (see `Nodemap Trie` section)
#
# * a small "docket" file containing metadata
#
# While the nodemap data can be multiple tens of megabytes, the "docket" is
# small, so it is easy to update it automatically or to duplicate its content
# during a transaction.
#
# Multiple raw data files can exist at the same time (the currently valid one
# and a new one being used by an in-progress transaction). To accommodate
# this, the filename hosting the raw data has a variable part. The exact
# filename is specified inside the "docket" file.
#
# The docket file contains information to find, qualify and validate the raw
# data. Its content is currently very light, but it will expand as the on-disk
# nodemap gains the necessary features to be used in production.

# version 0 is experimental, no BC guarantee, do not use outside of tests.
ONDISK_VERSION = 0
S_VERSION = struct.Struct(">B")
S_HEADER = struct.Struct(">BQQQ")

ID_SIZE = 8


def _make_uid():
    """return a new unique identifier.

    The identifier is random and composed of ascii characters."""
    return nodemod.hex(os.urandom(ID_SIZE))


class NodeMapDocket(object):
    """metadata associated with persistent nodemap data

    The persistent data may come from disk or be on their way to disk.
    """

    def __init__(self, uid=None):
        if uid is None:
            uid = _make_uid()
        self.uid = uid
        self.tip_rev = None
        self.data_length = None
        self.data_unused = 0

    def copy(self):
        new = NodeMapDocket(uid=self.uid)
        new.tip_rev = self.tip_rev
        new.data_length = self.data_length
        new.data_unused = self.data_unused
        return new

    def __cmp__(self, other):
        if self.uid < other.uid:
            return -1
        if self.uid > other.uid:
            return 1
        elif self.data_length < other.data_length:
            return -1
        elif self.data_length > other.data_length:
            return 1
        return 0

    def __eq__(self, other):
        return self.uid == other.uid and self.data_length == other.data_length

    def serialize(self):
        """return serialized bytes for a docket using the passed uid"""
        data = []
        data.append(S_VERSION.pack(ONDISK_VERSION))
        headers = (
            len(self.uid),
            self.tip_rev,
            self.data_length,
            self.data_unused,
        )
        data.append(S_HEADER.pack(*headers))
        data.append(self.uid)
        return b''.join(data)
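
Editorial note, not part of the patch: the docket described in the `Nodemap docket file` section above is just a version byte, a `>BQQQ` header and the uid, which is exactly what `serialize()` emits and `persisted_data()` parses. A minimal sketch of that byte layout, with a made-up uid and made-up counters:

import struct

S_VERSION = struct.Struct(">B")    # on-disk format version
S_HEADER = struct.Struct(">BQQQ")  # uid length, tip_rev, data_length, data_unused

uid = b"0123456789abcdef"          # hypothetical 16-character hex uid
docket = (
    S_VERSION.pack(0)                           # ONDISK_VERSION
    + S_HEADER.pack(len(uid), 4000, 7872, 128)  # made-up tip_rev and byte counts
    + uid
)

# decoding it back, the way persisted_data() does
(version,) = S_VERSION.unpack(docket[: S_VERSION.size])
header_end = S_VERSION.size + S_HEADER.size
uid_size, tip_rev, data_length, data_unused = S_HEADER.unpack(
    docket[S_VERSION.size : header_end]
)
assert version == 0 and docket[header_end : header_end + uid_size] == uid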


def _rawdata_filepath(revlog, docket):
    """The (vfs relative) nodemap's rawdata file for a given uid"""
    prefix = revlog.nodemap_file[:-2]
    return b"%s-%s.nd" % (prefix, docket.uid)


def _other_rawdata_filepath(revlog, docket):
    prefix = revlog.nodemap_file[:-2]
    pattern = re.compile(b"(^|/)%s-[0-9a-f]+\.nd$" % prefix)
    new_file_path = _rawdata_filepath(revlog, docket)
    new_file_name = revlog.opener.basename(new_file_path)
    dirpath = revlog.opener.dirname(new_file_path)
    others = []
    for f in revlog.opener.listdir(dirpath):
        if pattern.match(f) and f != new_file_name:
            others.append(f)
    return others
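
Editorial note, not part of the patch: a small sketch of the file naming scheme these two helpers implement, assuming a docket file named, say, `00changelog.n`; the uid value is made up:

nodemap_file = b"00changelog.n"  # hypothetical docket file name
uid = b"0123456789abcdef"        # hypothetical uid read from the docket
prefix = nodemap_file[:-2]       # strip the trailing ".n"
rawdata_file = b"%s-%s.nd" % (prefix, uid)
assert rawdata_file == b"00changelog-0123456789abcdef.nd"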


### Nodemap Trie
#
# This is a simple reference implementation to compute and persist a nodemap
# trie. This reference implementation is write only. The python version of
# this is not expected to be actually used, since it won't provide any
# performance improvement over the existing non-persistent C implementation.
#
# The nodemap is persisted as a Trie using 4-bit addresses and 16-entry
# blocks. Each revision can be addressed using its node's shortest prefix.
#
# The trie is stored as a sequence of blocks. Each block contains 16 entries
# (signed 32bit integer, big endian). Each entry can be one of the following:
#
# * value >= 0 -> index of sub-block
# * value == -1 -> no value
# * value < -1 -> a revision value: rev = -(value+2)
#
# The implementation focuses on simplicity, not on performance. A Rust
# implementation should provide an efficient version of the same binary
# persistence. This reference python implementation is never meant to be
# extensively used in production.
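
Editorial note, not part of the patch: to make the encoding above concrete, here is a sketch of the two blocks produced for two revisions whose (made-up) nodes start with `ab` and `a1`. The shared first nibble forces a child block, children are written before their parent, and a revision `rev` is stored as `-(rev + 2)`:

import struct

S_BLOCK = struct.Struct(">" + ("l" * 16))
NO_ENTRY = -1
REV_OFFSET = 2

# child block, reached through slot 0xa of the root
child = [NO_ENTRY] * 16
child[0xB] = -(0 + REV_OFFSET)  # node "ab..." -> rev 0, stored as -2
child[0x1] = -(1 + REV_OFFSET)  # node "a1..." -> rev 1, stored as -3

# root block: slot 0xa holds the index of the child block, which is written
# first and therefore gets index 0
root = [NO_ENTRY] * 16
root[0xA] = 0

data = S_BLOCK.pack(*child) + S_BLOCK.pack(*root)
assert len(data) == 2 * S_BLOCK.size  # two fixed-size blocks, child then root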


def persistent_data(index):
    """return the persistent binary form for a nodemap for a given index
    """
    trie = _build_trie(index)
    return _persist_trie(trie)


def update_persistent_data(index, root, max_idx, last_rev):
    """return the incremental update for persistent nodemap from a given index
    """
    changed_block, trie = _update_trie(index, root, last_rev)
    return (
        changed_block * S_BLOCK.size,
        _persist_trie(trie, existing_idx=max_idx),
    )


S_BLOCK = struct.Struct(">" + ("l" * 16))

NO_ENTRY = -1
# rev 0 needs to be -2 because 0 is used by blocks and -1 is a special value.
REV_OFFSET = 2


def _transform_rev(rev):
    """Return the number used to represent the rev in the tree.

    (or retrieve a rev number from such representation)

    Note that this is an involution, a function equal to its inverse (i.e.
    which gives the identity when applied to itself).
    """
    return -(rev + REV_OFFSET)
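
Editorial note, not part of the patch: a tiny sanity check of the involution property, using a stand-in that mirrors `_transform_rev`:

def transform_rev(rev, offset=2):  # stand-in mirroring _transform_rev above
    return -(rev + offset)


assert transform_rev(0) == -2                   # rev 0 is stored as -2
assert transform_rev(transform_rev(17)) == 17   # applying it twice is the identity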


def _to_int(hex_digit):
    """turn a hexadecimal digit into a proper integer"""
    return int(hex_digit, 16)


class Block(dict):
    """represent a block of the Trie

    contains up to 16 entries indexed from 0 to 15"""

    def __init__(self):
        super(Block, self).__init__()
        # If this block exists on disk, here is its ID
        self.ondisk_id = None

    def __iter__(self):
        return iter(self.get(i) for i in range(16))


def _build_trie(index):
    """build a nodemap trie

    The nodemap stores a revision number for each unique prefix.

    Each block is a dictionary with keys in `[0, 15]`. Values are either
    another block or a revision number.
    """
    root = Block()
    for rev in range(len(index)):
        hex = nodemod.hex(index[rev][7])
        _insert_into_block(index, 0, root, rev, hex)
    return root
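
Editorial note, not part of the patch: a sketch of what `_build_trie` produces for two revisions sharing the leading nibble `a` (node values are made up, and only entry `[7]` of each index tuple matters here). It assumes this file lives at `mercurial/revlogutils/nodemap.py` in a Mercurial source tree so the module can be imported:

from mercurial.revlogutils import nodemap

node0 = b"\xab" + b"\x00" * 19  # hex "ab00...", made up
node1 = b"\xa1" + b"\x00" * 19  # hex "a100...", made up
fake_index = [(0,) * 7 + (node0,), (0,) * 7 + (node1,)]

root = nodemap._build_trie(fake_index)
assert isinstance(root[0xA], nodemap.Block)          # shared first nibble -> sub-block
assert root[0xA][0xB] == 0 and root[0xA][0x1] == 1   # second nibbles are unique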


def _update_trie(index, root, last_rev):
    """update a nodemap trie with the revisions added since `last_rev`"""
    changed = 0
    for rev in range(last_rev + 1, len(index)):
        hex = nodemod.hex(index[rev][7])
        changed += _insert_into_block(index, 0, root, rev, hex)
    return changed, root


def _insert_into_block(index, level, block, current_rev, current_hex):
    """insert a new revision in a block

    index: the index we are adding a revision for
    level: the depth of the current block in the trie
    block: the block currently being considered
    current_rev: the revision number we are adding
    current_hex: the hexadecimal representation of the node of that revision
    """
    changed = 1
    if block.ondisk_id is not None:
        block.ondisk_id = None
    hex_digit = _to_int(current_hex[level : level + 1])
    entry = block.get(hex_digit)
    if entry is None:
        # no entry, simply store the revision number
        block[hex_digit] = current_rev
    elif isinstance(entry, dict):
        # need to recurse to an underlying block
        changed += _insert_into_block(
            index, level + 1, entry, current_rev, current_hex
        )
    else:
        # collision with a previously unique prefix, inserting new
        # vertices to fit both entries.
        other_hex = nodemod.hex(index[entry][7])
        other_rev = entry
        new = Block()
        block[hex_digit] = new
        _insert_into_block(index, level + 1, new, other_rev, other_hex)
        _insert_into_block(index, level + 1, new, current_rev, current_hex)
    return changed


def _persist_trie(root, existing_idx=None):
    """turn a nodemap trie into persistent binary data

    See `_build_trie` for nodemap trie structure"""
    block_map = {}
    if existing_idx is not None:
        base_idx = existing_idx + 1
    else:
        base_idx = 0
    chunks = []
    for tn in _walk_trie(root):
        if tn.ondisk_id is not None:
            block_map[id(tn)] = tn.ondisk_id
        else:
            block_map[id(tn)] = len(chunks) + base_idx
            chunks.append(_persist_block(tn, block_map))
    return b''.join(chunks)


def _walk_trie(block):
    """yield all the blocks in a trie

    Children blocks are always yielded before their parent block.
    """
    for (_, item) in sorted(block.items()):
        if isinstance(item, dict):
            for sub_block in _walk_trie(item):
                yield sub_block
    yield block


def _persist_block(block_node, block_map):
    """produce persistent binary data for a single block

    Children blocks are assumed to be already persisted and present in
    block_map.
    """
    data = tuple(_to_value(v, block_map) for v in block_node)
    return S_BLOCK.pack(*data)


def _to_value(item, block_map):
    """persist any value as an integer"""
    if item is None:
        return NO_ENTRY
    elif isinstance(item, dict):
        return block_map[id(item)]
    else:
        return _transform_rev(item)


def parse_data(data):
    """parse nodemap data into a nodemap Trie"""
    if (len(data) % S_BLOCK.size) != 0:
        msg = "nodemap data size is not a multiple of block size (%d): %d"
        raise error.Abort(msg % (S_BLOCK.size, len(data)))
    if not data:
        return Block(), None
    block_map = {}
    new_blocks = []
    for i in range(0, len(data), S_BLOCK.size):
        block = Block()
        block.ondisk_id = len(block_map)
        block_map[block.ondisk_id] = block
        block_data = data[i : i + S_BLOCK.size]
        values = S_BLOCK.unpack(block_data)
        new_blocks.append((block, values))
    for b, values in new_blocks:
        for idx, v in enumerate(values):
            if v == NO_ENTRY:
                continue
            elif v >= 0:
                b[idx] = block_map[v]
            else:
                b[idx] = _transform_rev(v)
    return block, i // S_BLOCK.size
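
Editorial note, not part of the patch: a sketch tying the pieces together, showing the append-only scheme that the incremental path of `_persist_nodemap` relies on: a full write with `persistent_data()`, a reload with `parse_data()`, then an incremental update whose output is simply appended to the existing data. It assumes the module import from the sketch above, uses the `_all_revisions` debug helper defined further down, and the index is a throwaway stand-in exposing node hashes at position 7:

import os

from mercurial.revlogutils import nodemap

fake_index = [(0,) * 7 + (os.urandom(20),) for _ in range(5)]

full = nodemap.persistent_data(fake_index)  # full binary trie for revs 0..4
root, max_idx = nodemap.parse_data(full)    # reload the persisted form

fake_index.append((0,) * 7 + (os.urandom(20),))  # one new revision, rev 5
unused, extra = nodemap.update_persistent_data(fake_index, root, max_idx, 4)

# The update is append-only: old data plus the new blocks form a valid trie
# covering all six revisions, while `unused` counts the bytes now superseded.
new_root, _ = nodemap.parse_data(full + extra)
assert sorted(nodemap._all_revisions(new_root)) == list(range(6))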


# debug utility


def check_data(ui, index, data):
    """verify that the provided nodemap data are valid for the given index"""
    ret = 0
    ui.status((b"revision in index: %d\n") % len(index))
    root, __ = parse_data(data)
    all_revs = set(_all_revisions(root))
    ui.status((b"revision in nodemap: %d\n") % len(all_revs))
    for r in range(len(index)):
        if r not in all_revs:
            msg = b" revision missing from nodemap: %d\n" % r
            ui.write_err(msg)
            ret = 1
        else:
            all_revs.remove(r)
        nm_rev = _find_node(root, nodemod.hex(index[r][7]))
        if nm_rev is None:
            msg = b" revision node does not match any entries: %d\n" % r
            ui.write_err(msg)
            ret = 1
        elif nm_rev != r:
            msg = (
                b" revision node does not match the expected revision: "
                b"%d != %d\n" % (r, nm_rev)
            )
            ui.write_err(msg)
            ret = 1

    if all_revs:
        for r in sorted(all_revs):
            msg = b" extra revision in nodemap: %d\n" % r
            ui.write_err(msg)
            ret = 1
    return ret
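
Editorial note, not part of the patch: a sketch of driving `check_data` directly with a minimal stand-in for the `ui` object; the real wiring lives in Mercurial's debug commands. Module import assumed as in the sketches above:

from mercurial.revlogutils import nodemap


class _StubUI(object):
    """minimal stand-in exposing the two ui methods check_data uses"""

    def status(self, msg):
        print(msg.decode())

    def write_err(self, msg):
        print(msg.decode())


fake_index = [(0,) * 7 + (b"\x11" * 20,), (0,) * 7 + (b"\x22" * 20,)]
data = nodemap.persistent_data(fake_index)
assert nodemap.check_data(_StubUI(), fake_index, data) == 0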


def _all_revisions(root):
    """return all revisions stored in a Trie"""
    for block in _walk_trie(root):
        for v in block:
            if v is None or isinstance(v, Block):
                continue
            yield v


def _find_node(block, node):
    """find the revision associated with a given node"""
    entry = block.get(_to_int(node[0:1]))
    if isinstance(entry, dict):
        return _find_node(entry, node[1:])
    return entry