censor: accept censored revision during upgrade...
marmoute
r51972:15a50bfa default
@@ -1,3797 +1,3801 @@
# revlog.py - storage back-end for mercurial
# coding: utf8
#
# Copyright 2005-2007 Olivia Mackall <olivia@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""


import binascii
import collections
import contextlib
import io
import os
import struct
import weakref
import zlib

# import stuff from node for others to import from revlog
from .node import (
    bin,
    hex,
    nullrev,
    sha1nodeconstants,
    short,
    wdirrev,
)
from .i18n import _
from .revlogutils.constants import (
    ALL_KINDS,
    CHANGELOGV2,
    COMP_MODE_DEFAULT,
    COMP_MODE_INLINE,
    COMP_MODE_PLAIN,
    DELTA_BASE_REUSE_NO,
    DELTA_BASE_REUSE_TRY,
    ENTRY_RANK,
    FEATURES_BY_VERSION,
    FLAG_GENERALDELTA,
    FLAG_INLINE_DATA,
    INDEX_HEADER,
    KIND_CHANGELOG,
    KIND_FILELOG,
    RANK_UNKNOWN,
    REVLOGV0,
    REVLOGV1,
    REVLOGV1_FLAGS,
    REVLOGV2,
    REVLOGV2_FLAGS,
    REVLOG_DEFAULT_FLAGS,
    REVLOG_DEFAULT_FORMAT,
    REVLOG_DEFAULT_VERSION,
    SUPPORTED_FLAGS,
)
from .revlogutils.flagutil import (
    REVIDX_DEFAULT_FLAGS,
    REVIDX_ELLIPSIS,
    REVIDX_EXTSTORED,
    REVIDX_FLAGS_ORDER,
    REVIDX_HASCOPIESINFO,
    REVIDX_ISCENSORED,
    REVIDX_RAWTEXT_CHANGING_FLAGS,
)
from .thirdparty import attr
from . import (
    ancestor,
    dagop,
    error,
    mdiff,
    policy,
    pycompat,
    revlogutils,
    templatefilters,
    util,
)
from .interfaces import (
    repository,
    util as interfaceutil,
)
from .revlogutils import (
    deltas as deltautil,
    docket as docketutil,
    flagutil,
    nodemap as nodemaputil,
    randomaccessfile,
    revlogv0,
    rewrite,
    sidedata as sidedatautil,
)
from .utils import (
    storageutil,
    stringutil,
)

# blanked usage of all the names to prevent pyflakes constraints
# We need these names available in the module for extensions.

REVLOGV0
REVLOGV1
REVLOGV2
CHANGELOGV2
FLAG_INLINE_DATA
FLAG_GENERALDELTA
REVLOG_DEFAULT_FLAGS
REVLOG_DEFAULT_FORMAT
REVLOG_DEFAULT_VERSION
REVLOGV1_FLAGS
REVLOGV2_FLAGS
REVIDX_ISCENSORED
REVIDX_ELLIPSIS
REVIDX_HASCOPIESINFO
REVIDX_EXTSTORED
REVIDX_DEFAULT_FLAGS
REVIDX_FLAGS_ORDER
REVIDX_RAWTEXT_CHANGING_FLAGS

parsers = policy.importmod('parsers')
rustancestor = policy.importrust('ancestor')
rustdagop = policy.importrust('dagop')
rustrevlog = policy.importrust('revlog')

# Aliased for performance.
_zlibdecompress = zlib.decompress

# max size of inline data embedded into a revlog
_maxinline = 131072
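# (131072 bytes = 128 KiB; once an inline revlog's data grows past this
# threshold, it is expected to be split into separate index (.i) and
# data (.d) files — illustrative note, see the inline handling below)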

# Flag processors for REVIDX_ELLIPSIS.
def ellipsisreadprocessor(rl, text):
    return text, False


def ellipsiswriteprocessor(rl, text):
    return text, False


def ellipsisrawprocessor(rl, text):
    return False


ellipsisprocessor = (
    ellipsisreadprocessor,
    ellipsiswriteprocessor,
    ellipsisrawprocessor,
)
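# A flag processor is registered as a (read, write, raw) triple: the read
# and write transforms return a (text, validatehash) pair, while the raw
# variant only reports whether the stored rawtext can be hashed as-is.
# A minimal identity processor would look like this (illustrative sketch,
# not part of this module):
#
#   def noopread(rl, text):
#       return text, True
#
#   def noopraw(rl, text):
#       return True
#
#   noopprocessor = (noopread, noopread, noopraw)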


def _verify_revision(rl, skipflags, state, node):
    """Verify the integrity of the given revlog ``node`` while providing a hook
    point for extensions to influence the operation."""
    if skipflags:
        state[b'skipread'].add(node)
    else:
        # Side-effect: read content and verify hash.
        rl.revision(node)
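        # revision() recomputes the node hash from the reconstructed text
        # and raises on mismatch, so simply reading the revision doubles
        # as an integrity check.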


# True if a fast implementation for persistent-nodemap is available
#
# We also consider we have a "fast" implementation in "pure" python because
# people using pure don't really have performance considerations (and a
# wheelbarrow of other slowness sources)
HAS_FAST_PERSISTENT_NODEMAP = rustrevlog is not None or hasattr(
    parsers, 'BaseIndexObject'
)


@interfaceutil.implementer(repository.irevisiondelta)
@attr.s(slots=True)
class revlogrevisiondelta:
    node = attr.ib()
    p1node = attr.ib()
    p2node = attr.ib()
    basenode = attr.ib()
    flags = attr.ib()
    baserevisionsize = attr.ib()
    revision = attr.ib()
    delta = attr.ib()
    sidedata = attr.ib()
    protocol_flags = attr.ib()
    linknode = attr.ib(default=None)


@interfaceutil.implementer(repository.iverifyproblem)
@attr.s(frozen=True)
class revlogproblem:
    warning = attr.ib(default=None)
    error = attr.ib(default=None)
    node = attr.ib(default=None)


def parse_index_v1(data, inline):
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline)
    return index, cache


def parse_index_v2(data, inline):
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=REVLOGV2)
    return index, cache


def parse_index_cl_v2(data, inline):
    # call the C implementation to parse the index data
    index, cache = parsers.parse_index2(data, inline, format=CHANGELOGV2)
    return index, cache


if hasattr(parsers, 'parse_index_devel_nodemap'):

    def parse_index_v1_nodemap(data, inline):
        index, cache = parsers.parse_index_devel_nodemap(data, inline)
        return index, cache


else:
    parse_index_v1_nodemap = None


def parse_index_v1_mixed(data, inline):
    index, cache = parse_index_v1(data, inline)
    return rustrevlog.MixedIndex(index), cache


# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer)
_maxentrysize = 0x7FFFFFFF

FILE_TOO_SHORT_MSG = _(
    b'cannot read from revlog %s;'
    b' expected %d bytes from offset %d, data size is %d'
)

hexdigits = b'0123456789abcdefABCDEF'


class _Config:
    def copy(self):
        return self.__class__(**self.__dict__)
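
    # copy() rebuilds the instance from its __dict__, so the attrs-based
    # subclasses below get an independent shallow copy for free, e.g.
    # (illustrative):
    #
    #   >>> cfg = DeltaConfig(max_chain_len=1000)
    #   >>> cfg.copy().max_chain_len
    #   1000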


@attr.s()
class FeatureConfig(_Config):
    """Hold configuration values about the available revlog features"""

    # the default compression engine
    compression_engine = attr.ib(default=b'zlib')
    # compression engines options
    compression_engine_options = attr.ib(default=attr.Factory(dict))

    # can we use censor on this revlog
    censorable = attr.ib(default=False)
    # does this revlog use the "side data" feature
    has_side_data = attr.ib(default=False)
    # might remove rank configuration once the computation has no impact
    compute_rank = attr.ib(default=False)
    # parent order is supposed to be semantically irrelevant, so we
    # normally resort parents to ensure that the first parent is non-null,
    # if there is a non-null parent at all.
    # filelog abuses the parent order as flag to mark some instances of
    # meta-encoded files, so allow it to disable this behavior.
    canonical_parent_order = attr.ib(default=False)
    # can ellipsis commit be used
    enable_ellipsis = attr.ib(default=False)

    def copy(self):
        new = super().copy()
        new.compression_engine_options = self.compression_engine_options.copy()
        return new


@attr.s()
class DataConfig(_Config):
    """Hold configuration values about how the revlog data are read"""

    # should we try to open the "pending" version of the revlog
    try_pending = attr.ib(default=False)
    # should we try to open the "split" version of the revlog
    try_split = attr.ib(default=False)
    # When True, indexfile should be opened with checkambig=True at writing,
    # to avoid file stat ambiguity.
    check_ambig = attr.ib(default=False)

    # If true, use mmap instead of reading to deal with large index
    mmap_large_index = attr.ib(default=False)
    # how much data is large
    mmap_index_threshold = attr.ib(default=None)
    # How much data to read and cache into the raw revlog data cache.
    chunk_cache_size = attr.ib(default=65536)

    # Allow sparse reading of the revlog data
    with_sparse_read = attr.ib(default=False)
    # minimal density of a sparse read chunk
    sr_density_threshold = attr.ib(default=0.50)
    # minimal size of data we skip when performing sparse read
    sr_min_gap_size = attr.ib(default=262144)

    # are deltas encoded against arbitrary bases.
    generaldelta = attr.ib(default=False)


@attr.s()
class DeltaConfig(_Config):
    """Hold configuration values about how new deltas are computed

    Some attributes are duplicated from DataConfig to help keep each object
    self-contained.
    """

    # can deltas be encoded against arbitrary bases.
    general_delta = attr.ib(default=False)
    # Allow sparse writing of the revlog data
    sparse_revlog = attr.ib(default=False)
    # maximum length of a delta chain
    max_chain_len = attr.ib(default=None)
    # Maximum distance between delta chain base start and end
    max_deltachain_span = attr.ib(default=-1)
    # If `upper_bound_comp` is not None, this is the expected maximal gain from
    # compression for the data content.
    upper_bound_comp = attr.ib(default=None)
    # Should we try a delta against both parents
    delta_both_parents = attr.ib(default=True)
    # Test delta base candidate groups by chunks of this maximal size.
    candidate_group_chunk_size = attr.ib(default=0)
    # Should we display debug information about delta computation
    debug_delta = attr.ib(default=False)
    # trust incoming deltas by default
    lazy_delta = attr.ib(default=True)
    # trust the base of incoming deltas by default
    lazy_delta_base = attr.ib(default=False)
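
    # A sketch of how these configs are typically wired up (illustrative,
    # not part of this module): the opener's options may carry pre-built
    # instances, which revlog.__init__ copies so per-revlog tweaks do not
    # leak back into shared state:
    #
    #   cfg = DeltaConfig(general_delta=True, sparse_revlog=True)
    #   opener.options[b'delta-config'] = cfg
    #   # each revlog then does: self.delta_config = cfg.copy()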


class revlog:
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.

    If checkambig, indexfile is opened with checkambig=True at
    writing, to avoid file stat ambiguity.

    If mmaplargeindex is True, and an mmapindexthreshold is set, the
    index will be mmapped rather than read if it is larger than the
    configured threshold.

    If censorable is True, the revlog can have censored revisions.

    If `upperboundcomp` is not None, this is the expected maximal gain from
    compression for the data content.

    `concurrencychecker` is an optional function that receives 3 arguments: a
    file handle, a filename, and an expected position. It should check whether
    the current position in the file handle is valid, and log/warn/fail (by
    raising).

    See mercurial/revlogutils/constants.py for details about the content of an
    index entry.
    """

    _flagserrorclass = error.RevlogError

    @staticmethod
    def is_inline_index(header_bytes):
        """Determine if a revlog is inline from the initial bytes of the index"""
        header = INDEX_HEADER.unpack(header_bytes)[0]

        _format_flags = header & ~0xFFFF
        _format_version = header & 0xFFFF

        features = FEATURES_BY_VERSION[_format_version]
        return features[b'inline'](_format_flags)
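
    # The 4-byte index header packs the format version in its low 16 bits
    # and the feature flags in the high 16 bits; e.g. (illustrative)
    # REVLOGV1 | FLAG_INLINE_DATA == 0x00010001, so an index starting with
    # b'\x00\x01\x00\x01' is an inline v1 revlog.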

    def __init__(
        self,
        opener,
        target,
        radix,
        postfix=None,  # only exists for `tmpcensored` now
        checkambig=False,
        mmaplargeindex=False,
        censorable=False,
        upperboundcomp=None,
        persistentnodemap=False,
        concurrencychecker=None,
        trypending=False,
        try_split=False,
        canonical_parent_order=True,
    ):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.

        `target`: a (KIND, ID) tuple that identifies the content stored in
        this revlog. It helps the rest of the code to understand what the
        revlog is about without having to resort to heuristics and index
        filename analysis. Note that this must reliably be set by normal
        code, but test, debug, or performance measurement code might not
        set this to an accurate value.
        """
        self.upperboundcomp = upperboundcomp

        self.radix = radix

        self._docket_file = None
        self._indexfile = None
        self._datafile = None
        self._sidedatafile = None
        self._nodemap_file = None
        self.postfix = postfix
        self._trypending = trypending
        self._try_split = try_split
        self.opener = opener
        if persistentnodemap:
            self._nodemap_file = nodemaputil.get_nodemap_file(self)

        assert target[0] in ALL_KINDS
        assert len(target) == 2
        self.target = target
        if b'feature-config' in self.opener.options:
            self.feature_config = self.opener.options[b'feature-config'].copy()
        else:
            self.feature_config = FeatureConfig()
        self.feature_config.censorable = censorable
        self.feature_config.canonical_parent_order = canonical_parent_order
        if b'data-config' in self.opener.options:
            self.data_config = self.opener.options[b'data-config'].copy()
        else:
            self.data_config = DataConfig()
        self.data_config.check_ambig = checkambig
        self.data_config.mmap_large_index = mmaplargeindex
        if b'delta-config' in self.opener.options:
            self.delta_config = self.opener.options[b'delta-config'].copy()
        else:
            self.delta_config = DeltaConfig()

        # 3-tuple of (node, rev, text) for a raw revision.
        self._revisioncache = None
        # Maps rev to chain base rev.
        self._chainbasecache = util.lrucachedict(100)
        # 2-tuple of (offset, data) of raw data from the revlog at an offset.
        self._chunkcache = (0, b'')

        self.index = None
        self._docket = None
        self._nodemap_docket = None
        # Mapping of partial identifiers to full nodes.
        self._pcache = {}

        # other optional features

        # Make copy of flag processors so each revlog instance can support
        # custom flags.
        self._flagprocessors = dict(flagutil.flagprocessors)

        # 3-tuple of file handles being used for active writing.
        self._writinghandles = None
        # prevent nesting of addgroup
        self._adding_group = None

        self._loadindex()

        self._concurrencychecker = concurrencychecker

    @property
    def _generaldelta(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.general_delta", b"6.6", stacklevel=2
        )
        return self.delta_config.general_delta
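
    # Each property in this block is a deprecation shim: it warns once
    # through util.nouideprecwarn() and forwards to the matching *_config
    # attribute, so extensions using the pre-6.6 names keep working.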

    @property
    def _checkambig(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.data_config.checkambig", b"6.6", stacklevel=2
        )
        return self.data_config.check_ambig

    @property
    def _mmaplargeindex(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.data_config.mmap_large_index", b"6.6", stacklevel=2
        )
        return self.data_config.mmap_large_index

    @property
    def _censorable(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.feature_config.censorable", b"6.6", stacklevel=2
        )
        return self.feature_config.censorable

    @property
    def _chunkcachesize(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.data_config.chunk_cache_size", b"6.6", stacklevel=2
        )
        return self.data_config.chunk_cache_size

    @property
    def _maxchainlen(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.max_chain_len", b"6.6", stacklevel=2
        )
        return self.delta_config.max_chain_len

    @property
    def _deltabothparents(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.delta_both_parents", b"6.6", stacklevel=2
        )
        return self.delta_config.delta_both_parents

    @property
    def _candidate_group_chunk_size(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.candidate_group_chunk_size",
            b"6.6",
            stacklevel=2,
        )
        return self.delta_config.candidate_group_chunk_size

    @property
    def _debug_delta(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.debug_delta", b"6.6", stacklevel=2
        )
        return self.delta_config.debug_delta

    @property
    def _compengine(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.feature_config.compression_engine",
            b"6.6",
            stacklevel=2,
        )
        return self.feature_config.compression_engine

    @property
    def _compengineopts(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.feature_config.compression_engine_options",
            b"6.6",
            stacklevel=2,
        )
        return self.feature_config.compression_engine_options

    @property
    def _maxdeltachainspan(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.max_deltachain_span", b"6.6", stacklevel=2
        )
        return self.delta_config.max_deltachain_span

    @property
    def _withsparseread(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.data_config.with_sparse_read", b"6.6", stacklevel=2
        )
        return self.data_config.with_sparse_read

    @property
    def _sparserevlog(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.sparse_revlog", b"6.6", stacklevel=2
        )
        return self.delta_config.sparse_revlog

    @property
    def hassidedata(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.feature_config.has_side_data", b"6.6", stacklevel=2
        )
        return self.feature_config.has_side_data

    @property
    def _srdensitythreshold(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.data_config.sr_density_threshold",
            b"6.6",
            stacklevel=2,
        )
        return self.data_config.sr_density_threshold

    @property
    def _srmingapsize(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.data_config.sr_min_gap_size", b"6.6", stacklevel=2
        )
        return self.data_config.sr_min_gap_size

    @property
    def _compute_rank(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.feature_config.compute_rank", b"6.6", stacklevel=2
        )
        return self.feature_config.compute_rank

    @property
    def canonical_parent_order(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.feature_config.canonical_parent_order",
            b"6.6",
            stacklevel=2,
        )
        return self.feature_config.canonical_parent_order

    @property
    def _lazydelta(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.lazy_delta", b"6.6", stacklevel=2
        )
        return self.delta_config.lazy_delta

    @property
    def _lazydeltabase(self):
        """temporary compatibility proxy"""
        util.nouideprecwarn(
            b"use revlog.delta_config.lazy_delta_base", b"6.6", stacklevel=2
        )
        return self.delta_config.lazy_delta_base

    def _init_opts(self):
        """process options (from above/config) to set up the associated default revlog mode

        These values might be affected when actually reading on-disk information.

        The relevant values are returned for use in _loadindex().

        * newversionflags:
            version header to use if we need to create a new revlog

        * mmapindexthreshold:
            minimal index size to start using mmap

        * force_nodemap:
            force the usage of a "development" version of the nodemap code
        """
        opts = self.opener.options

        if b'changelogv2' in opts and self.revlog_kind == KIND_CHANGELOG:
            new_header = CHANGELOGV2
            compute_rank = opts.get(b'changelogv2.compute-rank', True)
            self.feature_config.compute_rank = compute_rank
        elif b'revlogv2' in opts:
            new_header = REVLOGV2
        elif b'revlogv1' in opts:
            new_header = REVLOGV1 | FLAG_INLINE_DATA
            if b'generaldelta' in opts:
                new_header |= FLAG_GENERALDELTA
        elif b'revlogv0' in self.opener.options:
            new_header = REVLOGV0
        else:
            new_header = REVLOG_DEFAULT_VERSION

        mmapindexthreshold = None
        if self.data_config.mmap_large_index:
            mmapindexthreshold = self.data_config.mmap_index_threshold
        if self.feature_config.enable_ellipsis:
            self._flagprocessors[REVIDX_ELLIPSIS] = ellipsisprocessor

        # revlog v0 doesn't have flag processors
        for flag, processor in opts.get(b'flagprocessors', {}).items():
            flagutil.insertflagprocessor(flag, processor, self._flagprocessors)

        chunk_cache_size = self.data_config.chunk_cache_size
        if chunk_cache_size <= 0:
            raise error.RevlogError(
                _(b'revlog chunk cache size %r is not greater than 0')
                % chunk_cache_size
            )
        elif chunk_cache_size & (chunk_cache_size - 1):
            raise error.RevlogError(
                _(b'revlog chunk cache size %r is not a power of 2')
                % chunk_cache_size
            )
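        # x & (x - 1) == 0 holds exactly for powers of two: a power of two
        # has a single bit set, and subtracting one flips only the bits
        # below it; e.g. 65536 & 65535 == 0, while 65537 & 65536 != 0.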
        force_nodemap = opts.get(b'devel-force-nodemap', False)
        return new_header, mmapindexthreshold, force_nodemap

    def _get_data(self, filepath, mmap_threshold, size=None):
        """return a file content with or without mmap

        If the file is missing return the empty string"""
        try:
            with self.opener(filepath) as fp:
                if mmap_threshold is not None:
                    file_size = self.opener.fstat(fp).st_size
                    if file_size >= mmap_threshold:
                        if size is not None:
                            # avoid potential mmap crash
                            size = min(file_size, size)
                        # TODO: should .close() to release resources without
                        # relying on Python GC
                        if size is None:
                            return util.buffer(util.mmapread(fp))
                        else:
                            return util.buffer(util.mmapread(fp, size))
                if size is None:
                    return fp.read()
                else:
                    return fp.read(size)
        except FileNotFoundError:
            return b''
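
    # A typical call probes with a size hint (illustrative; the real calls
    # appear in _loadindex below):
    #
    #   data = self._get_data(self._indexfile, mmap_threshold, size=end)
    #
    # Large files come back as an mmap-backed buffer, small ones as bytes,
    # and a missing file yields b'' so absent and empty revlogs look alike.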

    def get_streams(self, max_linkrev, force_inline=False):
        """return a list of streams that represent this revlog

        This is used by stream-clone to do byte-for-byte copies of a repository.

        This streams data for all revisions that refer to a changelog revision up
        to `max_linkrev`.

        If `force_inline` is set, it enforces that the stream will represent an inline revlog.

        It returns a list of three-tuples:

        [
            (filename, bytes_stream, stream_size),
            …
        ]
        """
        n = len(self)
        index = self.index
        while n > 0:
            linkrev = index[n - 1][4]
            if linkrev < max_linkrev:
                break
            # note: this loop will rarely go through multiple iterations, since
            # it only traverses commits created during the current streaming
            # pull operation.
            #
            # If this becomes a problem, using a binary search should cap the
            # runtime of this.
            n = n - 1
        if n == 0:
            # no data to send
            return []
        index_size = n * index.entry_size
        data_size = self.end(n - 1)

        # XXX we might have been split (or stripped) since the object
        # initialization; we need to close this race too, e.g. by having a
        # way to pre-open the files we feed to the revlog and never closing
        # them before we are done streaming.

        if self._inline:

            def get_stream():
                with self._indexfp() as fp:
                    yield None
                    size = index_size + data_size
                    if size <= 65536:
                        yield fp.read(size)
                    else:
                        yield from util.filechunkiter(fp, limit=size)

            inline_stream = get_stream()
            next(inline_stream)
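            # priming the generator up to its first `yield None` opens the
            # index file now, rather than when the stream is consumed, which
            # narrows the race mentioned in the XXX note above.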
            return [
                (self._indexfile, inline_stream, index_size + data_size),
            ]
        elif force_inline:

            def get_stream():
                with self.reading():
                    yield None

                    for rev in range(n):
                        idx = self.index.entry_binary(rev)
                        if rev == 0 and self._docket is None:
                            # re-inject the inline flag
                            header = self._format_flags
                            header |= self._format_version
                            header |= FLAG_INLINE_DATA
                            header = self.index.pack_header(header)
                            idx = header + idx
                        yield idx
                        yield self._getsegmentforrevs(rev, rev)[1]

            inline_stream = get_stream()
            next(inline_stream)
            return [
                (self._indexfile, inline_stream, index_size + data_size),
            ]
        else:

            def get_index_stream():
                with self._indexfp() as fp:
                    yield None
                    if index_size <= 65536:
                        yield fp.read(index_size)
                    else:
                        yield from util.filechunkiter(fp, limit=index_size)

            def get_data_stream():
                with self._datafp() as fp:
                    yield None
                    if data_size <= 65536:
                        yield fp.read(data_size)
                    else:
                        yield from util.filechunkiter(fp, limit=data_size)

            index_stream = get_index_stream()
            next(index_stream)
            data_stream = get_data_stream()
            next(data_stream)
            return [
                (self._datafile, data_stream, data_size),
                (self._indexfile, index_stream, index_size),
            ]
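
    # A stream-clone consumer might drain these streams like this
    # (illustrative sketch; `dest_opener` stands in for whatever vfs the
    # caller writes through):
    #
    #   for name, stream, size in rl.get_streams(max_linkrev):
    #       with dest_opener(name, b'wb') as fp:
    #           for chunk in stream:
    #               fp.write(chunk)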

    def _loadindex(self, docket=None):

        new_header, mmapindexthreshold, force_nodemap = self._init_opts()

        if self.postfix is not None:
            entry_point = b'%s.i.%s' % (self.radix, self.postfix)
        elif self._trypending and self.opener.exists(b'%s.i.a' % self.radix):
            entry_point = b'%s.i.a' % self.radix
        elif self._try_split and self.opener.exists(self._split_index_file):
            entry_point = self._split_index_file
        else:
            entry_point = b'%s.i' % self.radix
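        # e.g. for radix b'data/foo' the candidates are, in order:
        # b'data/foo.i.<postfix>' (tmpcensored), b'data/foo.i.a' (pending
        # transaction), the split index file, then plain b'data/foo.i'.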

        if docket is not None:
            self._docket = docket
            self._docket_file = entry_point
        else:
            self._initempty = True
            entry_data = self._get_data(entry_point, mmapindexthreshold)
            if len(entry_data) > 0:
                header = INDEX_HEADER.unpack(entry_data[:4])[0]
                self._initempty = False
            else:
                header = new_header

            self._format_flags = header & ~0xFFFF
            self._format_version = header & 0xFFFF

            supported_flags = SUPPORTED_FLAGS.get(self._format_version)
            if supported_flags is None:
                msg = _(b'unknown version (%d) in revlog %s')
                msg %= (self._format_version, self.display_id)
                raise error.RevlogError(msg)
            elif self._format_flags & ~supported_flags:
                msg = _(b'unknown flags (%#04x) in version %d revlog %s')
                display_flag = self._format_flags >> 16
                msg %= (display_flag, self._format_version, self.display_id)
                raise error.RevlogError(msg)

            features = FEATURES_BY_VERSION[self._format_version]
            self._inline = features[b'inline'](self._format_flags)
            self.delta_config.general_delta = features[b'generaldelta'](
                self._format_flags
            )
            self.feature_config.has_side_data = features[b'sidedata']

            if not features[b'docket']:
                self._indexfile = entry_point
                index_data = entry_data
            else:
                self._docket_file = entry_point
                if self._initempty:
                    self._docket = docketutil.default_docket(self, header)
                else:
                    self._docket = docketutil.parse_docket(
                        self, entry_data, use_pending=self._trypending
                    )

        if self._docket is not None:
            self._indexfile = self._docket.index_filepath()
            index_data = b''
            index_size = self._docket.index_end
            if index_size > 0:
                index_data = self._get_data(
                    self._indexfile, mmapindexthreshold, size=index_size
                )
                if len(index_data) < index_size:
                    msg = _(b'too few index data for %s: got %d, expected %d')
                    msg %= (self.display_id, len(index_data), index_size)
                    raise error.RevlogError(msg)

            self._inline = False
            # generaldelta implied by version 2 revlogs.
            self.delta_config.general_delta = True
            # the logic for persistent nodemap will be dealt with within the
            # main docket, so disable it for now.
            self._nodemap_file = None

        if self._docket is not None:
            self._datafile = self._docket.data_filepath()
            self._sidedatafile = self._docket.sidedata_filepath()
        elif self.postfix is None:
            self._datafile = b'%s.d' % self.radix
        else:
            self._datafile = b'%s.d.%s' % (self.radix, self.postfix)

        self.nodeconstants = sha1nodeconstants
        self.nullid = self.nodeconstants.nullid

        # sparse-revlog can't be on without general-delta (issue6056)
        if not self.delta_config.general_delta:
            self.delta_config.sparse_revlog = False

        self._storedeltachains = True

        devel_nodemap = (
            self._nodemap_file
            and force_nodemap
            and parse_index_v1_nodemap is not None
        )

        use_rust_index = False
        if rustrevlog is not None:
            if self._nodemap_file is not None:
                use_rust_index = True
            else:
                use_rust_index = self.opener.options.get(b'rust.index')

        self._parse_index = parse_index_v1
        if self._format_version == REVLOGV0:
            self._parse_index = revlogv0.parse_index_v0
        elif self._format_version == REVLOGV2:
            self._parse_index = parse_index_v2
        elif self._format_version == CHANGELOGV2:
            self._parse_index = parse_index_cl_v2
        elif devel_nodemap:
            self._parse_index = parse_index_v1_nodemap
        elif use_rust_index:
            self._parse_index = parse_index_v1_mixed
        try:
            d = self._parse_index(index_data, self._inline)
            index, chunkcache = d
            use_nodemap = (
                not self._inline
                and self._nodemap_file is not None
                and hasattr(index, 'update_nodemap_data')
            )
            if use_nodemap:
                nodemap_data = nodemaputil.persisted_data(self)
                if nodemap_data is not None:
                    docket = nodemap_data[0]
                    if (
991 len(d[0]) > docket.tip_rev
991 len(d[0]) > docket.tip_rev
992 and d[0][docket.tip_rev][7] == docket.tip_node
992 and d[0][docket.tip_rev][7] == docket.tip_node
993 ):
993 ):
994 # no changelog tampering
994 # no changelog tampering
995 self._nodemap_docket = docket
995 self._nodemap_docket = docket
996 index.update_nodemap_data(*nodemap_data)
996 index.update_nodemap_data(*nodemap_data)
997 except (ValueError, IndexError):
997 except (ValueError, IndexError):
998 raise error.RevlogError(
998 raise error.RevlogError(
999 _(b"index %s is corrupted") % self.display_id
999 _(b"index %s is corrupted") % self.display_id
1000 )
1000 )
1001 self.index = index
1001 self.index = index
1002 self._segmentfile = randomaccessfile.randomaccessfile(
1002 self._segmentfile = randomaccessfile.randomaccessfile(
1003 self.opener,
1003 self.opener,
1004 (self._indexfile if self._inline else self._datafile),
1004 (self._indexfile if self._inline else self._datafile),
1005 self.data_config.chunk_cache_size,
1005 self.data_config.chunk_cache_size,
1006 chunkcache,
1006 chunkcache,
1007 )
1007 )
1008 self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
1008 self._segmentfile_sidedata = randomaccessfile.randomaccessfile(
1009 self.opener,
1009 self.opener,
1010 self._sidedatafile,
1010 self._sidedatafile,
1011 self.data_config.chunk_cache_size,
1011 self.data_config.chunk_cache_size,
1012 )
1012 )
1013 # revnum -> (chain-length, sum-delta-length)
1013 # revnum -> (chain-length, sum-delta-length)
1014 self._chaininfocache = util.lrucachedict(500)
1014 self._chaininfocache = util.lrucachedict(500)
1015 # revlog header -> revlog compressor
1015 # revlog header -> revlog compressor
1016 self._decompressors = {}
1016 self._decompressors = {}
1017
1017
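        # Illustrative note (an assumption, not upstream code): both caches
        # are plain mappings. For a hypothetical rev 5 whose delta chain has
        # 3 links totalling 1234 compressed bytes, and for chunks carrying a
        # zlib-style b'x' header, they would end up holding:
        #
        #     self._chaininfocache[5] == (3, 1234)
        #     self._decompressors[b'x']  # cached zlib revlog decompressor
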
    def get_revlog(self):
        """simple function to mirror the API of other not-really-revlog classes"""
        return self

    @util.propertycache
    def revlog_kind(self):
        return self.target[0]

    @util.propertycache
    def display_id(self):
        """The public facing "ID" of the revlog that we use in messages"""
        if self.revlog_kind == KIND_FILELOG:
            # Reference the file without the "data/" prefix, so it is familiar
            # to the user.
            return self.target[1]
        else:
            return self.radix

    def _get_decompressor(self, t):
        try:
            compressor = self._decompressors[t]
        except KeyError:
            try:
                engine = util.compengines.forrevlogheader(t)
                compressor = engine.revlogcompressor(
                    self.feature_config.compression_engine_options
                )
                self._decompressors[t] = compressor
            except KeyError:
                raise error.RevlogError(
                    _(b'unknown compression type %s') % binascii.hexlify(t)
                )
        return compressor

    @util.propertycache
    def _compressor(self):
        engine = util.compengines[self.feature_config.compression_engine]
        return engine.revlogcompressor(
            self.feature_config.compression_engine_options
        )

    @util.propertycache
    def _decompressor(self):
        """the default decompressor"""
        if self._docket is None:
            return None
        t = self._docket.default_compression_header
        c = self._get_decompressor(t)
        return c.decompress

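    # Illustrative note (an assumption, not upstream code): decompressor
    # lookup is keyed by a chunk's compression header, so repeated headers
    # are served from the ``_decompressors`` cache, e.g.:
    #
    #     rl._get_decompressor(b'x')     # zlib-style header
    #     rl._get_decompressor(b'\x28')  # zstd-style header, if available
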
    def _indexfp(self):
        """file object for the revlog's index file"""
        return self.opener(self._indexfile, mode=b"r")

    def __index_write_fp(self):
        # You should not use this directly; use `_writing` instead.
        try:
            f = self.opener(
                self._indexfile,
                mode=b"r+",
                checkambig=self.data_config.check_ambig,
            )
            if self._docket is None:
                f.seek(0, os.SEEK_END)
            else:
                f.seek(self._docket.index_end, os.SEEK_SET)
            return f
        except FileNotFoundError:
            return self.opener(
                self._indexfile,
                mode=b"w+",
                checkambig=self.data_config.check_ambig,
            )

    def __index_new_fp(self):
        # You should not use this unless you are upgrading from an inline
        # revlog.
        return self.opener(
            self._indexfile,
            mode=b"w",
            checkambig=self.data_config.check_ambig,
            atomictemp=True,
        )

    def _datafp(self, mode=b'r'):
        """file object for the revlog's data file"""
        return self.opener(self._datafile, mode=mode)

    @contextlib.contextmanager
    def _sidedatareadfp(self):
        """file object suitable to read sidedata"""
        if self._writinghandles:
            yield self._writinghandles[2]
        else:
            with self.opener(self._sidedatafile) as fp:
                yield fp

    def tiprev(self):
        return len(self.index) - 1

    def tip(self):
        return self.node(self.tiprev())

    def __contains__(self, rev):
        return 0 <= rev < len(self)

    def __len__(self):
        return len(self.index)

    def __iter__(self):
        return iter(range(len(self)))

    def revs(self, start=0, stop=None):
        """iterate over all revs in this revlog (from start to stop)"""
        return storageutil.iterrevs(len(self), start=start, stop=stop)

    def hasnode(self, node):
        try:
            self.rev(node)
            return True
        except KeyError:
            return False

    def _candelta(self, baserev, rev):
        """whether two revisions (baserev, rev) can be delta-ed or not"""
        # Disable delta if either rev requires a content-changing flag
        # processor (ex. LFS). This is because such a flag processor can
        # alter the rawtext content that the delta will be based on, and two
        # clients could have the same revlog node with different flags (i.e.
        # different rawtext contents) and the delta could be incompatible.
        if (self.flags(baserev) & REVIDX_RAWTEXT_CHANGING_FLAGS) or (
            self.flags(rev) & REVIDX_RAWTEXT_CHANGING_FLAGS
        ):
            return False
        return True

    def update_caches(self, transaction):
        """update the on-disk caches

        If a transaction is passed, the update may be delayed to transaction
        commit."""
        if self._nodemap_file is not None:
            if transaction is None:
                nodemaputil.update_persistent_nodemap(self)
            else:
                nodemaputil.setup_persistent_nodemap(transaction, self)

    def clearcaches(self):
        """Clear in-memory caches"""
        self._revisioncache = None
        self._chainbasecache.clear()
        self._segmentfile.clear_cache()
        self._segmentfile_sidedata.clear_cache()
        self._pcache = {}
        self._nodemap_docket = None
        self.index.clearcaches()
        # The python code is the one responsible for validating the docket, so
        # we end up having to refresh it here.
        use_nodemap = (
            not self._inline
            and self._nodemap_file is not None
            and hasattr(self.index, 'update_nodemap_data')
        )
        if use_nodemap:
            nodemap_data = nodemaputil.persisted_data(self)
            if nodemap_data is not None:
                self._nodemap_docket = nodemap_data[0]
                self.index.update_nodemap_data(*nodemap_data)

    def rev(self, node):
        """return the revision number associated with a <nodeid>"""
        try:
            return self.index.rev(node)
        except TypeError:
            raise
        except error.RevlogError:
            # parsers.c radix tree lookup failed
            if (
                node == self.nodeconstants.wdirid
                or node in self.nodeconstants.wdirfilenodeids
            ):
                raise error.WdirUnsupported
            raise error.LookupError(node, self.display_id, _(b'no node'))

    # Accessors for index entries.

    # First tuple entry is 8 bytes. First 6 bytes are offset. Last 2 bytes
    # are flags.
    def start(self, rev):
        return int(self.index[rev][0] >> 16)

    def sidedata_cut_off(self, rev):
        sd_cut_off = self.index[rev][8]
        if sd_cut_off != 0:
            return sd_cut_off
        # This is some annoying dance, because entries without sidedata
        # currently use 0 as their offset (instead of previous-offset +
        # previous-size).
        #
        # We should reconsider this sidedata → 0 sidedata_offset policy.
        # In the meantime, we need this.
        while 0 <= rev:
            e = self.index[rev]
            if e[9] != 0:
                return e[8] + e[9]
            rev -= 1
        return 0

    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF

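    # Illustrative sketch (not upstream code): the first index entry packs a
    # 48-bit data offset together with 16 bits of flags, so the two
    # accessors above decompose a hypothetical packed value as:
    #
    #     packed = (4096 << 16) | REVIDX_ISCENSORED
    #     packed >> 16       # start(): byte offset 4096 in the data file
    #     packed & 0xFFFF    # flags(): REVIDX_ISCENSORED
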
    def length(self, rev):
        return self.index[rev][1]

    def sidedata_length(self, rev):
        if not self.feature_config.has_side_data:
            return 0
        return self.index[rev][9]

    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.rawdata(rev)
        return len(t)

    def size(self, rev):
        """length of non-raw text (processed by a "read" flag processor)"""
        # fast path: if no "read" flag processor could change the content,
        # size is rawsize. note: ELLIPSIS is known to not change the content.
        flags = self.flags(rev)
        if flags & (flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS) == 0:
            return self.rawsize(rev)

        return len(self.revision(rev))

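    # Illustrative note (not upstream code): the fast path in size() masks
    # ELLIPSIS out of the known flags before testing, so a revision whose
    # only flag is ELLIPSIS still avoids computing the full text:
    #
    #     mask = flagutil.REVIDX_KNOWN_FLAGS ^ REVIDX_ELLIPSIS
    #     REVIDX_ELLIPSIS & mask    # -> 0, rawsize() is enough
    #     REVIDX_EXTSTORED & mask   # -> nonzero, revision() must be built
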
    def fast_rank(self, rev):
        """Return the rank of a revision if already known, or None otherwise.

        The rank of a revision is the size of the sub-graph it defines as a
        head. Equivalently, the rank of a revision `r` is the size of the set
        `ancestors(r)`, `r` included.

        This method returns the rank retrieved from the revlog in constant
        time. It makes no attempt at computing unknown values for versions of
        the revlog which do not persist the rank.
        """
        rank = self.index[rev][ENTRY_RANK]
        if self._format_version != CHANGELOGV2 or rank == RANK_UNKNOWN:
            return None
        if rev == nullrev:
            return 0  # convention
        return rank

    def chainbase(self, rev):
        base = self._chainbasecache.get(rev)
        if base is not None:
            return base

        index = self.index
        iterrev = rev
        base = index[iterrev][3]
        while base != iterrev:
            iterrev = base
            base = index[iterrev][3]

        self._chainbasecache[rev] = base
        return base

    def linkrev(self, rev):
        return self.index[rev][4]

    def parentrevs(self, rev):
        try:
            entry = self.index[rev]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

        if self.feature_config.canonical_parent_order and entry[5] == nullrev:
            return entry[6], entry[5]
        else:
            return entry[5], entry[6]

    # fast parentrevs(rev) where rev isn't filtered
    _uncheckedparentrevs = parentrevs

    def node(self, rev):
        try:
            return self.index[rev][7]
        except IndexError:
            if rev == wdirrev:
                raise error.WdirUnsupported
            raise

    # Derived from index values.

    def end(self, rev):
        return self.start(rev) + self.length(rev)

    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        # inline node() to avoid function call overhead
        if self.feature_config.canonical_parent_order and d[5] == nullrev:
            return i[d[6]][7], i[d[5]][7]
        else:
            return i[d[5]][7], i[d[6]][7]

    def chainlen(self, rev):
        return self._chaininfo(rev)[0]

    def _chaininfo(self, rev):
        chaininfocache = self._chaininfocache
        if rev in chaininfocache:
            return chaininfocache[rev]
        index = self.index
        generaldelta = self.delta_config.general_delta
        iterrev = rev
        e = index[iterrev]
        clen = 0
        compresseddeltalen = 0
        while iterrev != e[3]:
            clen += 1
            compresseddeltalen += e[1]
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            if iterrev in chaininfocache:
                t = chaininfocache[iterrev]
                clen += t[0]
                compresseddeltalen += t[1]
                break
            e = index[iterrev]
        else:
            # Add text length of base since decompressing that also takes
            # work. For cache hits the length is already included.
            compresseddeltalen += e[1]
        r = (clen, compresseddeltalen)
        chaininfocache[rev] = r
        return r

    def _deltachain(self, rev, stoprev=None):
        """Obtain the delta chain for a revision.

        ``stoprev`` specifies a revision to stop at. If not specified, we
        stop at the base of the chain.

        Returns a 2-tuple of (chain, stopped) where ``chain`` is a list of
        revs in ascending order and ``stopped`` is a bool indicating whether
        ``stoprev`` was hit.
        """
        generaldelta = self.delta_config.general_delta
        # Try C implementation.
        try:
            return self.index.deltachain(rev, stoprev, generaldelta)
        except AttributeError:
            pass

        chain = []

        # Alias to prevent attribute lookup in tight loop.
        index = self.index

        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != stoprev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]

        if iterrev == stoprev:
            stopped = True
        else:
            chain.append(iterrev)
            stopped = False

        chain.reverse()
        return chain, stopped

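    # Illustrative sketch (not upstream code): with general delta, index
    # slot 3 holds the delta parent, so for a toy mapping where rev 2
    # deltas against rev 1 and rev 1 against rev 0 (its own base):
    #
    #     bases = {0: 0, 1: 0, 2: 1}   # rev -> delta base (slot 3)
    #     chain, r = [], 2
    #     while bases[r] != r:
    #         chain.append(r)
    #         r = bases[r]
    #     chain.append(r)
    #     chain.reverse()              # -> [0, 1, 2], base first
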
    def ancestors(self, revs, stoprev=0, inclusive=False):
        """Generate the ancestors of 'revs' in reverse revision order.
        Does not generate revs lower than stoprev.

        See the documentation for ancestor.lazyancestors for more details."""

        # first, make sure start revisions aren't filtered
        revs = list(revs)
        checkrev = self.node
        for r in revs:
            checkrev(r)
        # and we're sure ancestors aren't filtered as well

        if rustancestor is not None and self.index.rust_ext_compat:
            lazyancestors = rustancestor.LazyAncestors
            arg = self.index
        else:
            lazyancestors = ancestor.lazyancestors
            arg = self._uncheckedparentrevs
        return lazyancestors(arg, revs, stoprev=stoprev, inclusive=inclusive)

    def descendants(self, revs):
        return dagop.descendantrevs(revs, self.revs, self.parentrevs)

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common. In revset terminology, we return the
        tuple:

        ::common, (::heads) - (::common)

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [self.nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        class lazyset:
            def __init__(self, lazyvalues):
                self.addedvalues = set()
                self.lazyvalues = lazyvalues

            def __contains__(self, value):
                return value in self.addedvalues or value in self.lazyvalues

            def __iter__(self):
                added = self.addedvalues
                for r in added:
                    yield r
                for r in self.lazyvalues:
                    if r not in added:
                        yield r

            def add(self, value):
                self.addedvalues.add(value)

            def update(self, values):
                self.addedvalues.update(values)

        has = lazyset(self.ancestors(common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = collections.deque(r for r in heads if r not in has)
        while visit:
            r = visit.popleft()
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(miss) for miss in missing]

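    # Illustrative sketch (not upstream code): on a toy linear graph
    # 0 -> 1 -> 2 -> 3, with common=[node 1] and heads=[node 3], the walk
    # above computes the revset (::3) - (::1):
    #
    #     has == {nullrev, 0, 1}   # inclusive ancestors of common
    #     missing == [2, 3]        # sorted, hence topologically sorted
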
    def incrementalmissingrevs(self, common=None):
        """Return an object that can be used to incrementally compute the
        revision numbers of the ancestors of arbitrary sets that are not
        ancestors of common. This is an ancestor.incrementalmissingancestors
        object.

        'common' is a list of revision numbers. If common is not supplied, uses
        nullrev.
        """
        if common is None:
            common = [nullrev]

        if rustancestor is not None and self.index.rust_ext_compat:
            return rustancestor.MissingAncestors(self.index, common)
        return ancestor.incrementalmissingancestors(self.parentrevs, common)

    def findmissingrevs(self, common=None, heads=None):
        """Return the revision numbers of the ancestors of heads that
        are not ancestors of common.

        More specifically, return a list of revision numbers corresponding to
        nodes N such that every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of revision numbers. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullrev."""
        if common is None:
            common = [nullrev]
        if heads is None:
            heads = self.headrevs()

        inc = self.incrementalmissingrevs(common=common)
        return inc.missingancestors(heads)

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [self.nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        inc = self.incrementalmissingrevs(common=common)
        return [self.node(r) for r in inc.missingancestors(heads)]

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses the list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [self.nullid]  # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return (
                [self.node(r) for r in self],
                [self.nullid],
                list(self.heads()),
            )
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == self.nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n)  # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update(
                            [p for p in self.parents(n) if p != self.nullid]
                        )
                    elif n in heads:  # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [root for root in roots if root in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(root) for root in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [self.nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev:  # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents are
                # descendants. (We seeded the dependents list with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [head for head, flag in heads.items() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def headrevs(self, revs=None):
        if revs is None:
            try:
                return self.index.headrevs()
            except AttributeError:
                return self._headrevs()
        if rustdagop is not None and self.index.rust_ext_compat:
            return rustdagop.headrevs(self.index, revs)
        return dagop.headrevs(revs, self._uncheckedparentrevs)

    def computephases(self, roots):
        return self.index.computephasesmapsets(roots)

    def _headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        # we won't iter over filtered revs, so nobody is a head at start
        ishead = [0] * (count + 1)
        index = self.index
        for r in self:
            ishead[r] = 1  # I may be a head
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0  # my parents are not
        return [r for r, val in enumerate(ishead) if val]

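    # Illustrative sketch (not upstream code): for a toy linear log
    # 0 <- 1 <- 2, the marking pass above runs as follows; the extra list
    # slot absorbs writes through ishead[nullrev] (i.e. ishead[-1]):
    #
    #     ishead = [0, 0, 0, 0]   # len(self) + 1 slots
    #     # r=0 sets slot 0; r=1 sets slot 1 and clears slot 0;
    #     # r=2 sets slot 2 and clears slot 1  ->  heads == [2]
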
    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [self.nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullrev
        else:
            start = self.rev(start)

        stoprevs = {self.rev(n) for n in stop or []}

        revs = dagop.headrevssubset(
            self.revs, self.parentrevs, startrev=start, stoprevs=stoprevs
        )

        return [self.node(rev) for rev in revs]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in self.revs(start=p + 1):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

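    # Illustrative note (not upstream code): the forward scan above works
    # because a child's revision number is always greater than its parents',
    # so every child of ``p`` appears after it; e.g. a hypothetical call:
    #
    #     rl.children(rl.nullid)   # -> nodes of all parentless revisions
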
    def commonancestorsheads(self, a, b):
        """calculate all the heads of the common ancestors of nodes a and b"""
        a, b = self.rev(a), self.rev(b)
        ancs = self._commonancestorsheads(a, b)
        return pycompat.maplist(self.node, ancs)

    def _commonancestorsheads(self, *revs):
        """calculate all the heads of the common ancestors of revs"""
        try:
            ancs = self.index.commonancestorsheads(*revs)
        except (AttributeError, OverflowError):  # C implementation failed
            ancs = ancestor.commonancestorsheads(self.parentrevs, *revs)
        return ancs

    def isancestor(self, a, b):
        """return True if node a is an ancestor of node b

        A revision is considered an ancestor of itself."""
        a, b = self.rev(a), self.rev(b)
        return self.isancestorrev(a, b)

    def isancestorrev(self, a, b):
        """return True if revision a is an ancestor of revision b

        A revision is considered an ancestor of itself.

        The implementation of this is trivial but the use of
        reachableroots is not."""
        if a == nullrev:
            return True
        elif a == b:
            return True
        elif a > b:
            return False
        return bool(self.reachableroots(a, [b], [a], includepath=False))

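    # Example (sketch): the early exits above encode revlog invariants: the
    # null revision precedes everything, and a parent always has a smaller
    # revision number than its children, so `a > b` can never be an ancestor
    # relationship. Assuming `rl` is any revlog:
    #
    #   rl.isancestorrev(nullrev, 0)  # True, null is everyone's ancestor
    #   rl.isancestorrev(5, 5)        # True, reflexive by definition
    #   rl.isancestorrev(7, 3)        # False, ancestors have lower revs
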
    def reachableroots(self, minroot, heads, roots, includepath=False):
        """return (heads(::(<roots> and <roots>::<heads>)))

        If includepath is True, return (<roots>::<heads>)."""
        try:
            return self.index.reachableroots2(
                minroot, heads, roots, includepath
            )
        except AttributeError:
            return dagop._reachablerootspure(
                self.parentrevs, minroot, roots, heads, includepath
            )

    def ancestor(self, a, b):
        """calculate the "best" common ancestor of nodes a and b"""

        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.ancestors(a, b)
        except (AttributeError, OverflowError):
            ancs = ancestor.ancestors(self.parentrevs, a, b)
        if ancs:
            # choose a consistent winner when there's a tie
            return min(map(self.node, ancs))
        return self.nullid

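    # Example (sketch): when two revisions have several equally good common
    # ancestors (a "criss-cross" merge), taking `min` over the binary nodeids
    # picks an arbitrary but stable winner, so repeated calls agree. Assuming
    # `cl` is a changelog and `n1`/`n2` two of its nodes:
    #
    #   anc = cl.ancestor(n1, n2)
    #   assert anc == cl.ancestor(n2, n1)  # symmetric and deterministic
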
    def _match(self, id):
        if isinstance(id, int):
            # rev
            return self.node(id)
        if len(id) == self.nodeconstants.nodelen:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node)  # quick search the index
                return node
            except error.LookupError:
                pass  # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if b"%d" % rev != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 2 * self.nodeconstants.nodelen:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (binascii.Error, error.LookupError):
                pass

    def _partialmatch(self, id):
        # we don't care about wdirfilenodeids as they should always be full
        # hashes
        maybewdir = self.nodeconstants.wdirhex.startswith(id)
        ambiguous = False
        try:
            partial = self.index.partialmatch(id)
            if partial and self.hasnode(partial):
                if maybewdir:
                    # single 'ff...' match in radix tree, ambiguous with wdir
                    ambiguous = True
                else:
                    return partial
            elif maybewdir:
                # no 'ff...' match in radix tree, wdir identified
                raise error.WdirUnsupported
            else:
                return None
        except error.RevlogError:
            # parsers.c radix tree lookup gave multiple matches
            # fast path: for unfiltered changelog, radix tree is accurate
            if not getattr(self, 'filteredrevs', None):
                ambiguous = True
            # fall through to slow path that filters hidden revisions
        except (AttributeError, ValueError):
            # we are pure python, or key is not hex
            pass
        if ambiguous:
            raise error.AmbiguousPrefixLookupError(
                id, self.display_id, _(b'ambiguous identifier')
            )

        if id in self._pcache:
            return self._pcache[id]

        if len(id) <= 40:
            # hex(node)[:...]
            l = len(id) // 2 * 2  # grab an even number of digits
            try:
                # we're dropping the last digit, so let's check that it's hex,
                # to avoid the expensive computation below if it's not
                if len(id) % 2 > 0:
                    if not (id[-1] in hexdigits):
                        return None
                prefix = bin(id[:l])
            except binascii.Error:
                pass
            else:
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [
                    n for n in nl if hex(n).startswith(id) and self.hasnode(n)
                ]
                if self.nodeconstants.nullhex.startswith(id):
                    nl.append(self.nullid)
                if len(nl) > 0:
                    if len(nl) == 1 and not maybewdir:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise error.AmbiguousPrefixLookupError(
                        id, self.display_id, _(b'ambiguous identifier')
                    )
                if maybewdir:
                    raise error.WdirUnsupported
                return None

    def lookup(self, id):
        """locate a node based on:
        - revision number or str(revision number)
        - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise error.LookupError(id, self.display_id, _(b'no match found'))

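    # Example (sketch): `lookup` accepts several spellings of the same
    # revision. Assuming `cl` is a changelog whose revision 0 has a hex
    # nodeid starting with b'1e4e' (a hypothetical value):
    #
    #   cl.lookup(0)        # integer revision number
    #   cl.lookup(b'0')     # str(revision number), as bytes
    #   cl.lookup(b'1e4e')  # unambiguous hex prefix
    #   cl.lookup(node)     # the binary nodeid itself
    #
    # All four return the same binary nodeid, or raise LookupError.
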
    def shortest(self, node, minlength=1):
        """Find the shortest unambiguous prefix that matches node."""

        def isvalid(prefix):
            try:
                matchednode = self._partialmatch(prefix)
            except error.AmbiguousPrefixLookupError:
                return False
            except error.WdirUnsupported:
                # single 'ff...' match
                return True
            if matchednode is None:
                raise error.LookupError(node, self.display_id, _(b'no node'))
            return True

        def maybewdir(prefix):
            return all(c == b'f' for c in pycompat.iterbytestr(prefix))

        hexnode = hex(node)

        def disambiguate(hexnode, minlength):
            """Disambiguate against wdirid."""
            for length in range(minlength, len(hexnode) + 1):
                prefix = hexnode[:length]
                if not maybewdir(prefix):
                    return prefix

        if not getattr(self, 'filteredrevs', None):
            try:
                length = max(self.index.shortest(node), minlength)
                return disambiguate(hexnode, length)
            except error.RevlogError:
                if node != self.nodeconstants.wdirid:
                    raise error.LookupError(
                        node, self.display_id, _(b'no node')
                    )
            except AttributeError:
                # Fall through to pure code
                pass

        if node == self.nodeconstants.wdirid:
            for length in range(minlength, len(hexnode) + 1):
                prefix = hexnode[:length]
                if isvalid(prefix):
                    return prefix

        for length in range(minlength, len(hexnode) + 1):
            prefix = hexnode[:length]
            if isvalid(prefix):
                return disambiguate(hexnode, length)

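    # Example (sketch): assuming `cl` is a changelog and `node` one of its
    # nodeids, `shortest` returns the fewest hex digits that still resolve
    # uniquely, never shorter than `minlength` and never a prefix made only
    # of 'f's (which could be mistaken for the working-directory id):
    #
    #   prefix = cl.shortest(node, minlength=4)
    #   assert cl.lookup(prefix) == node
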
    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different from what is stored.
        """
        p1, p2 = self.parents(node)
        return storageutil.hashrevisionsha1(text, p1, p2) != node

    def _getsegmentforrevs(self, startrev, endrev):
        """Obtain a segment of raw data corresponding to a range of revisions.

        Accepts the start and end revisions.

        Requests for data may be satisfied by a cache.

        Returns a 2-tuple of (offset, data) for the requested range of
        revisions. Offset is the integer offset from the beginning of the
        revlog and data is a str or buffer of the raw byte data.

        Callers will need to call ``self.start(rev)`` and ``self.length(rev)``
        to determine where each revision's data begins and ends.
        """
        # Inlined self.start(startrev) & self.end(endrev) for perf reasons
        # (functions are expensive).
        index = self.index
        istart = index[startrev]
        start = int(istart[0] >> 16)
        if startrev == endrev:
            end = start + istart[1]
        else:
            iend = index[endrev]
            end = int(iend[0] >> 16) + iend[1]

        if self._inline:
            start += (startrev + 1) * self.index.entry_size
            end += (endrev + 1) * self.index.entry_size
        length = end - start

        return start, self._segmentfile.read_chunk(start, length)

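    # Example (sketch): in an inline revlog the index entries and data chunks
    # are interleaved in the same `.i` file, so a data offset must be shifted
    # past the (rev + 1) index entries written before it. Assuming the
    # 64-byte revlogv1 entry size:
    #
    #   rev 0 chunk at data offset 0  -> file offset 0 + 1 * 64 = 64
    #   rev 1 chunk at data offset 30 -> file offset 30 + 2 * 64 = 158
    #
    # Non-inline revlogs keep data in a separate `.d` file and skip the shift.
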
    def _chunk(self, rev):
        """Obtain a single decompressed chunk for a revision.

        Accepts an integer revision.

        Returns a str holding uncompressed data for the requested revision.
        """
        compression_mode = self.index[rev][10]
        data = self._getsegmentforrevs(rev, rev)[1]
        if compression_mode == COMP_MODE_PLAIN:
            return data
        elif compression_mode == COMP_MODE_DEFAULT:
            return self._decompressor(data)
        elif compression_mode == COMP_MODE_INLINE:
            return self.decompress(data)
        else:
            msg = b'unknown compression mode %d'
            msg %= compression_mode
            raise error.RevlogError(msg)

    def _chunks(self, revs, targetsize=None):
        """Obtain decompressed chunks for the specified revisions.

        Accepts an iterable of numeric revisions that are assumed to be in
        ascending order.

        This function is similar to calling ``self._chunk()`` multiple times,
        but is faster.

        Returns a list with decompressed data for each requested revision.
        """
        if not revs:
            return []
        start = self.start
        length = self.length
        inline = self._inline
        iosize = self.index.entry_size
        buffer = util.buffer

        l = []
        ladd = l.append

        if not self.data_config.with_sparse_read:
            slicedchunks = (revs,)
        else:
            slicedchunks = deltautil.slicechunk(
                self, revs, targetsize=targetsize
            )

        for revschunk in slicedchunks:
            firstrev = revschunk[0]
            # Skip trailing revisions with empty diff
            for lastrev in revschunk[::-1]:
                if length(lastrev) != 0:
                    break

            try:
                offset, data = self._getsegmentforrevs(firstrev, lastrev)
            except OverflowError:
                # issue4215 - we can't cache a run of chunks greater than
                # 2G on Windows
                return [self._chunk(rev) for rev in revschunk]

            decomp = self.decompress
            # self._decompressor might be None, but will not be used in
            # that case
            def_decomp = self._decompressor
            for rev in revschunk:
                chunkstart = start(rev)
                if inline:
                    chunkstart += (rev + 1) * iosize
                chunklength = length(rev)
                comp_mode = self.index[rev][10]
                c = buffer(data, chunkstart - offset, chunklength)
                if comp_mode == COMP_MODE_PLAIN:
                    ladd(c)
                elif comp_mode == COMP_MODE_INLINE:
                    ladd(decomp(c))
                elif comp_mode == COMP_MODE_DEFAULT:
                    ladd(def_decomp(c))
                else:
                    msg = b'unknown compression mode %d'
                    msg %= comp_mode
                    raise error.RevlogError(msg)

        return l

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self.delta_config.general_delta:
            return base
        else:
            return rev - 1

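    # Example (sketch): the index stores a delta-base field per revision. A
    # base equal to the revision itself marks a full snapshot. Otherwise,
    # general-delta revlogs record the true base, while legacy revlogs always
    # delta against the previous revision:
    #
    #   base == rev              -> nullrev (full text, no delta parent)
    #   general delta, base == 4 -> 4
    #   legacy format, rev == 7  -> 6 (always rev - 1)
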
    def issnapshot(self, rev):
        """tells whether rev is a snapshot"""
        if not self.delta_config.sparse_revlog:
            return self.deltaparent(rev) == nullrev
        elif hasattr(self.index, 'issnapshot'):
            # directly assign the method to cache the testing and access
            self.issnapshot = self.index.issnapshot
            return self.issnapshot(rev)
        if rev == nullrev:
            return True
        entry = self.index[rev]
        base = entry[3]
        if base == rev:
            return True
        if base == nullrev:
            return True
        p1 = entry[5]
        while self.length(p1) == 0:
            b = self.deltaparent(p1)
            if b == p1:
                break
            p1 = b
        p2 = entry[6]
        while self.length(p2) == 0:
            b = self.deltaparent(p2)
            if b == p2:
                break
            p2 = b
        if base == p1 or base == p2:
            return False
        return self.issnapshot(base)

    def snapshotdepth(self, rev):
        """number of snapshots in the chain before this one"""
        if not self.issnapshot(rev):
            raise error.ProgrammingError(b'revision %d not a snapshot' % rev)
        return len(self._deltachain(rev)[0]) - 1

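    # Example (sketch): in a sparse revlog a "snapshot" is a revision whose
    # delta chain does not run through one of its parents: either a full text
    # (base == rev or base == nullrev) or an intermediate snapshot stored as
    # a delta against another snapshot. A chain might look like:
    #
    #   rev 10 (full snapshot) <- rev 25 (intermediate snapshot) <- rev 31
    #
    # where rev 31 is a plain delta and snapshotdepth(25) would be 1.
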
    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions

        The delta calculated is in binary form and is intended to be written to
        revlog data directly. So this function needs raw revision data.
        """
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return bytes(self._chunk(rev2))

        return mdiff.textdiff(self.rawdata(rev1), self.rawdata(rev2))

    def revision(self, nodeorrev):
        """return an uncompressed revision of a given node or revision
        number.
        """
        return self._revisiondata(nodeorrev)

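    # Example (sketch): `revision` runs flag processors (censoring, ellipsis,
    # external storage, ...) so it yields the logical text, while `rawdata`
    # below returns the bytes as stored. For a revision with no special flags
    # the two agree; assuming `rl` is any revlog:
    #
    #   if rl.flags(rev) == REVIDX_DEFAULT_FLAGS:
    #       assert rl.revision(rev) == rl.rawdata(rev)
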
    def sidedata(self, nodeorrev):
        """a map of extra data related to the changeset but not part of the hash

        This function currently returns a dictionary. However, a more
        advanced mapping object will likely be used in the future for more
        efficient/lazy code.
        """
        # deal with <nodeorrev> argument type
        if isinstance(nodeorrev, int):
            rev = nodeorrev
        else:
            rev = self.rev(nodeorrev)
        return self._sidedata(rev)

    def _revisiondata(self, nodeorrev, raw=False):
        # deal with <nodeorrev> argument type
        if isinstance(nodeorrev, int):
            rev = nodeorrev
            node = self.node(rev)
        else:
            node = nodeorrev
            rev = None

        # fast path the special `nullid` rev
        if node == self.nullid:
            return b""

        # ``rawtext`` is the text as stored inside the revlog. Might be the
        # revision or might need to be processed to retrieve the revision.
        rev, rawtext, validated = self._rawtext(node, rev)

        if raw and validated:
            # if we don't want to process the raw text and that raw
            # text is cached, we can exit early.
            return rawtext
        if rev is None:
            rev = self.rev(node)
        # the revlog's flags for this revision
        # (usually alter its state or content)
        flags = self.flags(rev)

        if validated and flags == REVIDX_DEFAULT_FLAGS:
            # no extra flags set, no flag processor runs, text = rawtext
            return rawtext

        if raw:
            validatehash = flagutil.processflagsraw(self, rawtext, flags)
            text = rawtext
        else:
            r = flagutil.processflagsread(self, rawtext, flags)
            text, validatehash = r
        if validatehash:
            self.checkhash(text, node, rev=rev)
        if not validated:
            self._revisioncache = (node, rev, rawtext)

        return text

    def _rawtext(self, node, rev):
        """return the possibly unvalidated rawtext for a revision

        returns (rev, rawtext, validated)
        """

        # revision in the cache (could be useful to apply delta)
        cachedrev = None
        # An intermediate text to apply deltas to
        basetext = None

        # Check if we have the entry in cache
        # The cache entry looks like (node, rev, rawtext)
        if self._revisioncache:
            if self._revisioncache[0] == node:
                return (rev, self._revisioncache[2], True)
            cachedrev = self._revisioncache[1]

        if rev is None:
            rev = self.rev(node)

        chain, stopped = self._deltachain(rev, stoprev=cachedrev)
        if stopped:
            basetext = self._revisioncache[2]

        # drop cache to save memory, the caller is expected to
        # update self._revisioncache after validating the text
        self._revisioncache = None

        targetsize = None
        rawsize = self.index[rev][2]
        if 0 <= rawsize:
            targetsize = 4 * rawsize

        bins = self._chunks(chain, targetsize=targetsize)
        if basetext is None:
            basetext = bytes(bins[0])
            bins = bins[1:]

        rawtext = mdiff.patches(basetext, bins)
        del basetext  # let us have a chance to free memory early
        return (rev, rawtext, False)

    def _sidedata(self, rev):
        """Return the sidedata for a given revision number."""
        index_entry = self.index[rev]
        sidedata_offset = index_entry[8]
        sidedata_size = index_entry[9]

        if self._inline:
            sidedata_offset += self.index.entry_size * (1 + rev)
        if sidedata_size == 0:
            return {}

        if self._docket.sidedata_end < sidedata_offset + sidedata_size:
            filename = self._sidedatafile
            end = self._docket.sidedata_end
            offset = sidedata_offset
            length = sidedata_size
            m = FILE_TOO_SHORT_MSG % (filename, length, offset, end)
            raise error.RevlogError(m)

        comp_segment = self._segmentfile_sidedata.read_chunk(
            sidedata_offset, sidedata_size
        )

        comp = self.index[rev][11]
        if comp == COMP_MODE_PLAIN:
            segment = comp_segment
        elif comp == COMP_MODE_DEFAULT:
            segment = self._decompressor(comp_segment)
        elif comp == COMP_MODE_INLINE:
            segment = self.decompress(comp_segment)
        else:
            msg = b'unknown compression mode %d'
            msg %= comp
            raise error.RevlogError(msg)

        sidedata = sidedatautil.deserialize_sidedata(segment)
        return sidedata

    def rawdata(self, nodeorrev):
        """return the uncompressed raw data of a given node or revision number."""
        return self._revisiondata(nodeorrev, raw=True)

    def hash(self, text, p1, p2):
        """Compute a node hash.

        Available as a function so that subclasses can replace the hash
        as needed.
        """
        return storageutil.hashrevisionsha1(text, p1, p2)

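    # Example (sketch): the default implementation hashes the two parent
    # nodeids in sorted order followed by the text, conceptually:
    #
    #   import hashlib
    #   def node_sha1(text, p1, p2):
    #       a, b = sorted((p1, p2))
    #       return hashlib.sha1(a + b + text).digest()
    #
    # Sorting the parents makes the hash independent of parent order.
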
    def checkhash(self, text, node, p1=None, p2=None, rev=None):
        """Check node hash integrity.

        Available as a function so that subclasses can extend hash mismatch
        behaviors as needed.
        """
        try:
            if p1 is None and p2 is None:
                p1, p2 = self.parents(node)
            if node != self.hash(text, p1, p2):
                # Clear the revision cache on hash failure. The revision cache
                # only stores the raw revision and clearing the cache does have
                # the side-effect that we won't have a cache hit when the raw
                # revision data is accessed. But this case should be rare and
                # it is extra work to teach the cache about the hash
                # verification state.
                if self._revisioncache and self._revisioncache[0] == node:
                    self._revisioncache = None

                revornode = rev
                if revornode is None:
                    revornode = templatefilters.short(hex(node))
                raise error.RevlogError(
                    _(b"integrity check failed on %s:%s")
                    % (self.display_id, pycompat.bytestr(revornode))
                )
        except error.RevlogError:
            if self.feature_config.censorable and storageutil.iscensoredtext(
                text
            ):
                raise error.CensoredNodeError(self.display_id, node, text)
            raise

    @property
    def _split_index_file(self):
        """the path at which to expect the index of an ongoing splitting
        operation

        The file will only exist if a splitting operation is in progress, but
        it is always expected at the same location."""
        parts = self.radix.split(b'/')
        if len(parts) > 1:
            # add a '-s' suffix to the ``data/`` or ``meta/`` base directory
            head = parts[0] + b'-s'
            mids = parts[1:-1]
            tail = parts[-1] + b'.i'
            pieces = [head] + mids + [tail]
            return b'/'.join(pieces)
        else:
            # the revlog is stored at the root of the store (changelog or
            # manifest), no risk of collision.
            return self.radix + b'.i.s'

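    # Example (sketch): for a filelog with radix b'data/foo/bar' the split
    # index is staged at b'data-s/foo/bar.i', while a store-root revlog with
    # radix b'00changelog' would use b'00changelog.i.s'. Staging outside
    # ``data/`` avoids colliding with a tracked file whose name ends in the
    # staging suffix.
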
    def _enforceinlinesize(self, tr, side_write=True):
        """Check if the revlog is too big for inline and convert if so.

        This should be called after revisions are added to the revlog. If the
        revlog has grown too large to be an inline revlog, it will convert it
        to use multiple index and data files.
        """
        tiprev = len(self) - 1
        total_size = self.start(tiprev) + self.length(tiprev)
        if not self._inline or total_size < _maxinline:
            return

        troffset = tr.findoffset(self._indexfile)
        if troffset is None:
            raise error.RevlogError(
                _(b"%s not found in the transaction") % self._indexfile
            )
        if troffset:
            tr.addbackup(self._indexfile, for_offset=True)
        tr.add(self._datafile, 0)

        existing_handles = False
        if self._writinghandles is not None:
            existing_handles = True
            fp = self._writinghandles[0]
            fp.flush()
            fp.close()
            # We can't use the cached file handle after close(). So prevent
            # its usage.
            self._writinghandles = None
            self._segmentfile.writing_handle = None
            # No need to deal with sidedata writing handle as it is only
            # relevant with revlog-v2 which is never inline, not reaching
            # this code
        if side_write:
            old_index_file_path = self._indexfile
            new_index_file_path = self._split_index_file
            opener = self.opener
            weak_self = weakref.ref(self)

            # the "split" index replaces the real index when the transaction
            # is finalized
            def finalize_callback(tr):
                opener.rename(
                    new_index_file_path,
                    old_index_file_path,
                    checkambig=True,
                )
                maybe_self = weak_self()
                if maybe_self is not None:
                    maybe_self._indexfile = old_index_file_path

            def abort_callback(tr):
                maybe_self = weak_self()
                if maybe_self is not None:
                    maybe_self._indexfile = old_index_file_path

            tr.registertmp(new_index_file_path)
            if self.target[1] is not None:
                callback_id = b'000-revlog-split-%d-%s' % self.target
            else:
                callback_id = b'000-revlog-split-%d' % self.target[0]
            tr.addfinalize(callback_id, finalize_callback)
            tr.addabort(callback_id, abort_callback)

        new_dfh = self._datafp(b'w+')
        new_dfh.truncate(0)  # drop any potentially existing data
        try:
            with self.reading():
                for r in self:
                    new_dfh.write(self._getsegmentforrevs(r, r)[1])
                new_dfh.flush()

            if side_write:
                self._indexfile = new_index_file_path
                with self.__index_new_fp() as fp:
                    self._format_flags &= ~FLAG_INLINE_DATA
                    self._inline = False
                    for i in self:
                        e = self.index.entry_binary(i)
                        if i == 0 and self._docket is None:
                            header = self._format_flags | self._format_version
                            header = self.index.pack_header(header)
                            e = header + e
                        fp.write(e)
                    if self._docket is not None:
                        self._docket.index_end = fp.tell()

                    # If we don't use side-write, the temp file replaces the
                    # real index when we exit the context manager

            nodemaputil.setup_persistent_nodemap(tr, self)
            self._segmentfile = randomaccessfile.randomaccessfile(
                self.opener,
                self._datafile,
                self.data_config.chunk_cache_size,
            )

            if existing_handles:
                # switched from inline to conventional; reopen the index
                ifh = self.__index_write_fp()
                self._writinghandles = (ifh, new_dfh, None)
                self._segmentfile.writing_handle = new_dfh
                new_dfh = None
                # No need to deal with sidedata writing handle as it is only
                # relevant with revlog-v2 which is never inline, not reaching
                # this code
        finally:
            if new_dfh is not None:
                new_dfh.close()

    def _nodeduplicatecallback(self, transaction, node):
        """called when trying to add a node already stored."""

    @contextlib.contextmanager
    def reading(self):
        """Context manager that keeps data and sidedata files open for reading"""
        if len(self.index) == 0:
            yield  # nothing to be read
        else:
            with self._segmentfile.reading():
                with self._segmentfile_sidedata.reading():
                    yield

    @contextlib.contextmanager
    def _writing(self, transaction):
        if self._trypending:
            msg = b'try to write in a `trypending` revlog: %s'
            msg %= self.display_id
            raise error.ProgrammingError(msg)
        if self._writinghandles is not None:
            yield
        else:
            ifh = dfh = sdfh = None
            try:
                r = len(self)
                # opening the data file.
                dsize = 0
                if r:
                    dsize = self.end(r - 1)
                dfh = None
                if not self._inline:
                    try:
                        dfh = self._datafp(b"r+")
                        if self._docket is None:
                            dfh.seek(0, os.SEEK_END)
                        else:
                            dfh.seek(self._docket.data_end, os.SEEK_SET)
                    except FileNotFoundError:
                        dfh = self._datafp(b"w+")
                    transaction.add(self._datafile, dsize)
                if self._sidedatafile is not None:
                    # revlog-v2 does not inline, help Pytype
                    assert dfh is not None
                    try:
                        sdfh = self.opener(self._sidedatafile, mode=b"r+")
                        # position the sidedata handle at the end of the
                        # existing sidedata
                        sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)
                    except FileNotFoundError:
                        sdfh = self.opener(self._sidedatafile, mode=b"w+")
                    transaction.add(
                        self._sidedatafile, self._docket.sidedata_end
                    )

                # opening the index file.
                isize = r * self.index.entry_size
                ifh = self.__index_write_fp()
                if self._inline:
                    transaction.add(self._indexfile, dsize + isize)
                else:
                    transaction.add(self._indexfile, isize)
                # exposing all file handles for writing.
                self._writinghandles = (ifh, dfh, sdfh)
                self._segmentfile.writing_handle = ifh if self._inline else dfh
                self._segmentfile_sidedata.writing_handle = sdfh
                yield
                if self._docket is not None:
                    self._write_docket(transaction)
            finally:
                self._writinghandles = None
                self._segmentfile.writing_handle = None
                self._segmentfile_sidedata.writing_handle = None
                if dfh is not None:
                    dfh.close()
                if sdfh is not None:
                    sdfh.close()
                # closing the index file last to avoid exposing references to
                # potentially unflushed data content.
                if ifh is not None:
                    ifh.close()

    def _write_docket(self, transaction):
        """write the current docket on disk

        Exists as a method to help the changelog implement transaction logic.

        We could also imagine using the same transaction logic for all revlogs
        since dockets are cheap."""
        self._docket.write(transaction)

    def addrevision(
        self,
        text,
        transaction,
        link,
        p1,
        p2,
        cachedelta=None,
        node=None,
        flags=REVIDX_DEFAULT_FLAGS,
        deltacomputer=None,
        sidedata=None,
    ):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use a different hashing method (and override checkhash() in such case)
        flags - the known flags to set on the revision
        deltacomputer - an optional deltacomputer instance shared between
        multiple calls
        """
        if link == nullrev:
            raise error.RevlogError(
                _(b"attempted to add linkrev -1 to %s") % self.display_id
            )

        if sidedata is None:
            sidedata = {}
        elif sidedata and not self.feature_config.has_side_data:
            raise error.ProgrammingError(
                _(b"trying to add sidedata to a revlog that doesn't support them")
            )

        if flags:
            node = node or self.hash(text, p1, p2)

        rawtext, validatehash = flagutil.processflagswrite(self, text, flags)

        # If the flag processor modifies the revision data, ignore any provided
        # cachedelta.
        if rawtext != text:
            cachedelta = None

        if len(rawtext) > _maxentrysize:
            raise error.RevlogError(
                _(
                    b"%s: size of %d bytes exceeds maximum revlog storage of 2GiB"
                )
                % (self.display_id, len(rawtext))
            )

        node = node or self.hash(rawtext, p1, p2)
        rev = self.index.get_rev(node)
        if rev is not None:
            return rev

        if validatehash:
            self.checkhash(rawtext, node, p1=p1, p2=p2)

        return self.addrawrevision(
            rawtext,
            transaction,
            link,
            p1,
            p2,
            node,
            flags,
            cachedelta=cachedelta,
            deltacomputer=deltacomputer,
            sidedata=sidedata,
        )

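    # Example (sketch): a minimal append, assuming an open transaction `tr`
    # and a filelog `fl` (both hypothetical caller-side objects):
    #
    #   rev = fl.addrevision(b'file content\n', tr, linkrev, p1, p2)
    #
    # Flag processors run on `text` first; the (possibly transformed) rawtext
    # is then hashed, deduplicated against the index, and handed to
    # addrawrevision() below inside the _writing() context.
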
    def addrawrevision(
        self,
        rawtext,
        transaction,
        link,
        p1,
        p2,
        node,
        flags,
        cachedelta=None,
        deltacomputer=None,
        sidedata=None,
    ):
        """add a raw revision with known flags, node and parents
        useful when reusing a revision not stored in this revlog (e.g.
        received over the wire, or read from an external bundle).
        """
        with self._writing(transaction):
            return self._addrevision(
                node,
                rawtext,
                transaction,
                link,
                p1,
                p2,
                flags,
                cachedelta,
                deltacomputer=deltacomputer,
                sidedata=sidedata,
            )

    def compress(self, data):
        """Generate a possibly-compressed representation of data."""
        if not data:
            return b'', data

        compressed = self._compressor.compress(data)

        if compressed:
            # The revlog compressor added the header in the returned data.
            return b'', compressed

        if data[0:1] == b'\0':
            return b'', data
        return b'u', data

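    # Example (sketch): compress() returns a (header, data) pair whose
    # concatenation is what gets stored. The header encodes how to undo it:
    #
    #   (b'', b'x\x9c...')  -> compressor output, self-identifying header
    #   (b'', b'\0...')     -> stored raw; a leading NUL already marks it
    #   (b'u', b'plain...') -> stored raw with an explicit 'u' (uncompressed)
    #
    # decompress() below dispatches on that first byte.
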
    def decompress(self, data):
        """Decompress a revlog chunk.

        The chunk is expected to begin with a header identifying the
        format type so it can be routed to an appropriate decompressor.
        """
        if not data:
            return data

        # Revlogs are read much more frequently than they are written and many
        # chunks only take microseconds to decompress, so performance is
        # important here.
        #
        # We can make a few assumptions about revlogs:
        #
        # 1) the majority of chunks will be compressed (as opposed to inline
        #    raw data).
        # 2) decompressing *any* data will likely be at least 10x slower than
        #    returning raw inline data.
        # 3) we want to prioritize common and officially supported compression
        #    engines
        #
        # It follows that we want to optimize for the "decompress compressed
        # data when encoded with common and officially supported compression
        # engines" case over "raw data" and "data encoded by less common or
        # non-official compression engines." That is why we have the inline
        # lookup first followed by the compengines lookup.
        #
        # According to `hg perfrevlogchunks`, this is ~0.5% faster for zlib
        # compressed chunks. And this matters for changelog and manifest reads.
        t = data[0:1]

        if t == b'x':
            try:
                return _zlibdecompress(data)
            except zlib.error as e:
                raise error.RevlogError(
                    _(b'revlog decompress error: %s')
                    % stringutil.forcebytestr(e)
                )
        # '\0' is more common than 'u' so it goes first.
        elif t == b'\0':
            return data
        elif t == b'u':
            return util.buffer(data, 1)

        compressor = self._get_decompressor(t)

        return compressor.decompress(data)

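    # Routing by type byte, summarized (a sketch; the mapping for bytes other
    # than the three fast-path values comes from the registered compression
    # engines via _get_decompressor):
    #
    #     b'x'  -> zlib stream (zlib headers happen to start with 'x')
    #     b'\0' -> stored raw; returned as-is, NUL byte included
    #     b'u'  -> stored uncompressed; strip the one-byte marker
    #     other -> engine lookup, e.g. a zstd frame's leading magic byte
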
    def _addrevision(
        self,
        node,
        rawtext,
        transaction,
        link,
        p1,
        p2,
        flags,
        cachedelta,
        alwayscache=False,
        deltacomputer=None,
        sidedata=None,
    ):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.

        note: "addrevision" takes non-raw text, "_addrevision" takes raw text.

        if "deltacomputer" is not provided or None, a default deltacomputer
        will be used.

        invariants:
        - rawtext is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        if node == self.nullid:
            raise error.RevlogError(
                _(b"%s: attempt to add null revision") % self.display_id
            )
        if (
            node == self.nodeconstants.wdirid
            or node in self.nodeconstants.wdirfilenodeids
        ):
            raise error.RevlogError(
                _(b"%s: attempt to add wdir revision") % self.display_id
            )
        if self._writinghandles is None:
            msg = b'adding revision outside `revlog._writing` context'
            raise error.ProgrammingError(msg)

        btext = [rawtext]

        curr = len(self)
        prev = curr - 1

        offset = self._get_data_offset(prev)

        if self._concurrencychecker:
            ifh, dfh, sdfh = self._writinghandles
            # XXX no checking for the sidedata file
            if self._inline:
                # offset is "as if" it were in the .d file, so we need to add
                # on the size of the entry metadata.
                self._concurrencychecker(
                    ifh, self._indexfile, offset + curr * self.index.entry_size
                )
            else:
                # Entries in the .i are a consistent size.
                self._concurrencychecker(
                    ifh, self._indexfile, curr * self.index.entry_size
                )
                self._concurrencychecker(dfh, self._datafile, offset)

        p1r, p2r = self.rev(p1), self.rev(p2)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if rawtext is None:
            # need rawtext size, before changed by flag processors, which is
            # the non-raw size. use revlog explicitly to avoid filelog's extra
            # logic that might remove metadata size.
            textlen = mdiff.patchedsize(
                revlog.size(self, cachedelta[0]), cachedelta[1]
            )
        else:
            textlen = len(rawtext)

        if deltacomputer is None:
            write_debug = None
            if self.delta_config.debug_delta:
                write_debug = transaction._report
            deltacomputer = deltautil.deltacomputer(
                self, write_debug=write_debug
            )

        if cachedelta is not None and len(cachedelta) == 2:
            # If the cached delta has no information about how it should be
            # reused, add the default reuse instruction according to the
            # revlog's configuration.
            if (
                self.delta_config.general_delta
                and self.delta_config.lazy_delta_base
            ):
                delta_base_reuse = DELTA_BASE_REUSE_TRY
            else:
                delta_base_reuse = DELTA_BASE_REUSE_NO
            cachedelta = (cachedelta[0], cachedelta[1], delta_base_reuse)

        revinfo = revlogutils.revisioninfo(
            node,
            p1,
            p2,
            btext,
            textlen,
            cachedelta,
            flags,
        )

        deltainfo = deltacomputer.finddeltainfo(revinfo)

        compression_mode = COMP_MODE_INLINE
        if self._docket is not None:
            default_comp = self._docket.default_compression_header
            r = deltautil.delta_compression(default_comp, deltainfo)
            compression_mode, deltainfo = r

        sidedata_compression_mode = COMP_MODE_INLINE
        if sidedata and self.feature_config.has_side_data:
            sidedata_compression_mode = COMP_MODE_PLAIN
            serialized_sidedata = sidedatautil.serialize_sidedata(sidedata)
            sidedata_offset = self._docket.sidedata_end
            h, comp_sidedata = self.compress(serialized_sidedata)
            if (
                h != b'u'
                and comp_sidedata[0:1] != b'\0'
                and len(comp_sidedata) < len(serialized_sidedata)
            ):
                assert not h
                if (
                    comp_sidedata[0:1]
                    == self._docket.default_compression_header
                ):
                    sidedata_compression_mode = COMP_MODE_DEFAULT
                    serialized_sidedata = comp_sidedata
                else:
                    sidedata_compression_mode = COMP_MODE_INLINE
                    serialized_sidedata = comp_sidedata
        else:
            serialized_sidedata = b""
            # Don't store the offset if the sidedata is empty, that way
            # we can easily detect empty sidedata and they will be no different
            # than ones we manually add.
            sidedata_offset = 0

        rank = RANK_UNKNOWN
        if self.feature_config.compute_rank:
            if (p1r, p2r) == (nullrev, nullrev):
                rank = 1
            elif p1r != nullrev and p2r == nullrev:
                rank = 1 + self.fast_rank(p1r)
            elif p1r == nullrev and p2r != nullrev:
                rank = 1 + self.fast_rank(p2r)
            else:  # merge node
                if rustdagop is not None and self.index.rust_ext_compat:
                    rank = rustdagop.rank(self.index, p1r, p2r)
                else:
                    pmin, pmax = sorted((p1r, p2r))
                    rank = 1 + self.fast_rank(pmax)
                    rank += sum(1 for _ in self.findmissingrevs([pmax], [pmin]))

        e = revlogutils.entry(
            flags=flags,
            data_offset=offset,
            data_compressed_length=deltainfo.deltalen,
            data_uncompressed_length=textlen,
            data_compression_mode=compression_mode,
            data_delta_base=deltainfo.base,
            link_rev=link,
            parent_rev_1=p1r,
            parent_rev_2=p2r,
            node_id=node,
            sidedata_offset=sidedata_offset,
            sidedata_compressed_length=len(serialized_sidedata),
            sidedata_compression_mode=sidedata_compression_mode,
            rank=rank,
        )

        self.index.append(e)
        entry = self.index.entry_binary(curr)
        if curr == 0 and self._docket is None:
            header = self._format_flags | self._format_version
            header = self.index.pack_header(header)
            entry = header + entry
        self._writeentry(
            transaction,
            entry,
            deltainfo.data,
            link,
            offset,
            serialized_sidedata,
            sidedata_offset,
        )

        rawtext = btext[0]

        if alwayscache and rawtext is None:
            rawtext = deltacomputer.buildtext(revinfo)

        if type(rawtext) == bytes:  # only accept immutable objects
            self._revisioncache = (node, curr, rawtext)
        self._chainbasecache[curr] = deltainfo.chainbase
        return curr

    def _get_data_offset(self, prev):
        """Returns the current offset in the (in-transaction) data file.

        Versions < 2 of the revlog can get this in O(1), while revlog v2 needs
        a docket file to store that information: since sidedata can be
        rewritten to the end of the data file within a transaction, you can
        have cases where, for example, rev `n` does not have sidedata while
        rev `n - 1` does, leading to `n - 1`'s sidedata being written after
        `n`'s data.

        TODO cache this in a docket file before getting out of experimental."""
        if self._docket is None:
            return self.end(prev)
        else:
            return self._docket.data_end

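    # Illustration of the two cases (a sketch, not code from this module):
    #
    #     # no docket (revlog v0/v1): the next write always goes right after
    #     # the previous revision, so end(prev) is the answer in O(1).
    #     offset = rl.end(prev)
    #
    #     # docket (revlog v2): sidedata rewrites may have moved the logical
    #     # end past end(prev), so only the docket knows the true append point.
    #     offset = rl._docket.data_end
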
    def _writeentry(
        self, transaction, entry, data, link, offset, sidedata, sidedata_offset
    ):
        # Files opened in a+ mode have inconsistent behavior on various
        # platforms. Windows requires that a file positioning call be made
        # when the file handle transitions between reads and writes. See
        # 3686fa2b8eee and the mixedfilemodewrapper in windows.py. On other
        # platforms, Python or the platform itself can be buggy. Some versions
        # of Solaris have been observed to not append at the end of the file
        # if the file was seeked to before the end. See issue4943 for more.
        #
        # We work around this issue by inserting a seek() before writing.
        # Note: This is likely not necessary on Python 3. However, because
        # the file handle is reused for reads and may be seeked there, we need
        # to be careful before changing this.
        if self._writinghandles is None:
            msg = b'adding revision outside `revlog._writing` context'
            raise error.ProgrammingError(msg)
        ifh, dfh, sdfh = self._writinghandles
        if self._docket is None:
            ifh.seek(0, os.SEEK_END)
        else:
            ifh.seek(self._docket.index_end, os.SEEK_SET)
        if dfh:
            if self._docket is None:
                dfh.seek(0, os.SEEK_END)
            else:
                dfh.seek(self._docket.data_end, os.SEEK_SET)
        if sdfh:
            sdfh.seek(self._docket.sidedata_end, os.SEEK_SET)

        curr = len(self) - 1
        if not self._inline:
            transaction.add(self._datafile, offset)
            if self._sidedatafile:
                transaction.add(self._sidedatafile, sidedata_offset)
            transaction.add(self._indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            if sidedata:
                sdfh.write(sidedata)
            ifh.write(entry)
        else:
            offset += curr * self.index.entry_size
            transaction.add(self._indexfile, offset)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            assert not sidedata
            self._enforceinlinesize(transaction)
        if self._docket is not None:
            # revlog-v2 always has 3 writing handles, help Pytype
            wh1 = self._writinghandles[0]
            wh2 = self._writinghandles[1]
            wh3 = self._writinghandles[2]
            assert wh1 is not None
            assert wh2 is not None
            assert wh3 is not None
            self._docket.index_end = wh1.tell()
            self._docket.data_end = wh2.tell()
            self._docket.sidedata_end = wh3.tell()

        nodemaputil.setup_persistent_nodemap(transaction, self)

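    # On-disk layouts handled above, summarized (a sketch):
    #
    #     split revlog:   .i -> |entry|entry|...       .d -> |chunk|chunk|...
    #     inline revlog:  .i -> |entry|chunk|entry|chunk|...
    #
    # which is why the inline branch biases the journal offset by
    # `curr * entry_size`: in an inline .i file every revision costs one
    # fixed-size index entry *plus* its variable-size data chunk.
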
    def addgroup(
        self,
        deltas,
        linkmapper,
        transaction,
        alwayscache=False,
        addrevisioncb=None,
        duplicaterevisioncb=None,
        debug_info=None,
        delta_base_reuse_policy=None,
    ):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.

        If ``addrevisioncb`` is defined, it will be called with arguments of
        this revlog and the node that was added.
        """

        if self._adding_group:
            raise error.ProgrammingError(b'cannot nest addgroup() calls')

        # read the default delta-base reuse policy from revlog config if the
        # group did not specify one.
        if delta_base_reuse_policy is None:
            if (
                self.delta_config.general_delta
                and self.delta_config.lazy_delta_base
            ):
                delta_base_reuse_policy = DELTA_BASE_REUSE_TRY
            else:
                delta_base_reuse_policy = DELTA_BASE_REUSE_NO

        self._adding_group = True
        empty = True
        try:
            with self._writing(transaction):
                write_debug = None
                if self.delta_config.debug_delta:
                    write_debug = transaction._report
                deltacomputer = deltautil.deltacomputer(
                    self,
                    write_debug=write_debug,
                    debug_info=debug_info,
                )
                # loop through our set of deltas
                for data in deltas:
                    (
                        node,
                        p1,
                        p2,
                        linknode,
                        deltabase,
                        delta,
                        flags,
                        sidedata,
                    ) = data
                    link = linkmapper(linknode)
                    flags = flags or REVIDX_DEFAULT_FLAGS

                    rev = self.index.get_rev(node)
                    if rev is not None:
                        # this can happen if two branches make the same change
                        self._nodeduplicatecallback(transaction, rev)
                        if duplicaterevisioncb:
                            duplicaterevisioncb(self, rev)
                        empty = False
                        continue

                    for p in (p1, p2):
                        if not self.index.has_node(p):
                            raise error.LookupError(
                                p, self.radix, _(b'unknown parent')
                            )

                    if not self.index.has_node(deltabase):
                        raise error.LookupError(
                            deltabase, self.display_id, _(b'unknown delta base')
                        )

                    baserev = self.rev(deltabase)

                    if baserev != nullrev and self.iscensored(baserev):
                        # if base is censored, delta must be full replacement
                        # in a single patch operation
                        hlen = struct.calcsize(b">lll")
                        oldlen = self.rawsize(baserev)
                        newlen = len(delta) - hlen
                        if delta[:hlen] != mdiff.replacediffheader(
                            oldlen, newlen
                        ):
                            raise error.CensoredBaseError(
                                self.display_id, self.node(baserev)
                            )

                    if not flags and self._peek_iscensored(baserev, delta):
                        flags |= REVIDX_ISCENSORED

                    # We assume consumers of addrevisioncb will want to
                    # retrieve the added revision, which will require a call
                    # to revision(). revision() will fast path if there is a
                    # cache hit. So, we tell _addrevision() to always cache in
                    # this case. We're only using addgroup() in the context of
                    # changegroup generation so the revision data can always
                    # be handled as raw by the flagprocessor.
                    rev = self._addrevision(
                        node,
                        None,
                        transaction,
                        link,
                        p1,
                        p2,
                        flags,
                        (baserev, delta, delta_base_reuse_policy),
                        alwayscache=alwayscache,
                        deltacomputer=deltacomputer,
                        sidedata=sidedata,
                    )

                    if addrevisioncb:
                        addrevisioncb(self, rev)
                    empty = False
        finally:
            self._adding_group = False
        return not empty

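    # Shape of one element of ``deltas`` as unpacked above, illustrated with
    # hypothetical values (this mirrors what changegroup code produces):
    #
    #     data = (
    #         node,       # binary node id of the new revision
    #         p1, p2,     # binary parent node ids
    #         linknode,   # changelog node this revision belongs to
    #         deltabase,  # node the delta applies against
    #         delta,      # binary patch text
    #         flags,      # REVIDX_* flags, 0 for the common case
    #         sidedata,   # dict of sidedata, or None
    #     )
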
    def iscensored(self, rev):
        """Check if a file revision is censored."""
        if not self.feature_config.censorable:
            return False

        return self.flags(rev) & REVIDX_ISCENSORED

    def _peek_iscensored(self, baserev, delta):
        """Quickly check if a delta produces a censored revision."""
        if not self.feature_config.censorable:
            return False

        return storageutil.deltaiscensored(delta, baserev, self.rawsize)

    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        return storageutil.resolvestripinfo(
            minlink,
            len(self) - 1,
            self.headrevs(),
            self.linkrev,
            self.parentrevs,
        )

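    # Hypothetical use, as done by strip-style callers: given the first
    # changelog revision being removed, find where to cut this revlog and
    # which retained revisions will point at renumbered changesets.
    #
    #     rev, brokenset = rl.getstrippoint(minlink)
    #     rl.strip(minlink, tr)  # truncates everything from `rev` onward
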
    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        data_end = self.start(rev)
        if not self._inline:
            transaction.add(self._datafile, data_end)
            end = rev * self.index.entry_size
        else:
            end = data_end + (rev * self.index.entry_size)

        if self._sidedatafile:
            sidedata_end = self.sidedata_cut_off(rev)
            transaction.add(self._sidedatafile, sidedata_end)

        transaction.add(self._indexfile, end)
        if self._docket is not None:
            # XXX we could leverage the docket while stripping; however, it
            # is not powerful enough at the time of this comment.
            self._docket.index_end = end
            self._docket.data_end = data_end
            self._docket.sidedata_end = sidedata_end
            self._docket.write(transaction, stripping=True)

        # then reset internal state in memory to forget those revisions
        self._revisioncache = None
        self._chaininfocache = util.lrucachedict(500)
        self._segmentfile.clear_cache()
        self._segmentfile_sidedata.clear_cache()

        del self.index[rev:-1]

    def checksize(self):
        """Check size of index and data files

        return a (dd, di) tuple.
        - dd: extra bytes for the "data" file
        - di: extra bytes for the "index" file

        A healthy revlog will return (0, 0).
        """
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            with self._datafp() as f:
                f.seek(0, io.SEEK_END)
                actual = f.tell()
            dd = actual - expected
        except FileNotFoundError:
            dd = 0

        try:
            f = self.opener(self._indexfile)
            f.seek(0, io.SEEK_END)
            actual = f.tell()
            f.close()
            s = self.index.entry_size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except FileNotFoundError:
            di = 0

        return (dd, di)

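    # Interpreting the result (a sketch): verify-style callers treat any
    # non-zero value as trailing garbage, typically from an interrupted write.
    #
    #     dd, di = rl.checksize()
    #     # dd != 0 -> the data (.d) file is longer or shorter than the
    #     #            index says it should be
    #     # di != 0 -> the index (.i) file has a partial trailing entry
    #     #            (or, inline, mismatched interleaved data)
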
    def files(self):
        res = [self._indexfile]
        if self._docket_file is None:
            if not self._inline:
                res.append(self._datafile)
        else:
            res.append(self._docket_file)
            res.extend(self._docket.old_index_filepaths(include_empty=False))
            if self._docket.data_end:
                res.append(self._datafile)
            res.extend(self._docket.old_data_filepaths(include_empty=False))
            if self._docket.sidedata_end:
                res.append(self._sidedatafile)
            res.extend(self._docket.old_sidedata_filepaths(include_empty=False))
        return res

    def emitrevisions(
        self,
        nodes,
        nodesorder=None,
        revisiondata=False,
        assumehaveparentrevisions=False,
        deltamode=repository.CG_DELTAMODE_STD,
        sidedata_helpers=None,
        debug_info=None,
    ):
        if nodesorder not in (b'nodes', b'storage', b'linear', None):
            raise error.ProgrammingError(
                b'unhandled value for nodesorder: %s' % nodesorder
            )

        if nodesorder is None and not self.delta_config.general_delta:
            nodesorder = b'storage'

        if (
            not self._storedeltachains
            and deltamode != repository.CG_DELTAMODE_PREV
        ):
            deltamode = repository.CG_DELTAMODE_FULL

        return storageutil.emitrevisions(
            self,
            nodes,
            nodesorder,
            revlogrevisiondelta,
            deltaparentfn=self.deltaparent,
            candeltafn=self._candelta,
            rawsizefn=self.rawsize,
            revdifffn=self.revdiff,
            flagsfn=self.flags,
            deltamode=deltamode,
            revisiondata=revisiondata,
            assumehaveparentrevisions=assumehaveparentrevisions,
            sidedata_helpers=sidedata_helpers,
            debug_info=debug_info,
        )

    DELTAREUSEALWAYS = b'always'
    DELTAREUSESAMEREVS = b'samerevs'
    DELTAREUSENEVER = b'never'

    DELTAREUSEFULLADD = b'fulladd'

    DELTAREUSEALL = {b'always', b'samerevs', b'never', b'fulladd'}

    def clone(
        self,
        tr,
        destrevlog,
        addrevisioncb=None,
        deltareuse=DELTAREUSESAMEREVS,
        forcedeltabothparents=None,
        sidedata_helpers=None,
    ):
        """Copy this revlog to another, possibly with format changes.

        The destination revlog will contain the same revisions and nodes.
        However, it may not be bit-for-bit identical due to e.g. delta encoding
        differences.

        The ``deltareuse`` argument controls how deltas from the existing
        revlog are preserved in the destination revlog. The argument can have
        the following values:

        DELTAREUSEALWAYS
          Deltas will always be reused (if possible), even if the destination
          revlog would not select the same revisions for the delta. This is the
          fastest mode of operation.
        DELTAREUSESAMEREVS
          Deltas will be reused if the destination revlog would pick the same
          revisions for the delta. This mode strikes a balance between speed
          and optimization.
        DELTAREUSENEVER
          Deltas will never be reused. This is the slowest mode of execution.
          This mode can be used to recompute deltas (e.g. if the diff/delta
          algorithm changes).
        DELTAREUSEFULLADD
          Revisions will be re-added as if they were new content. This is
          slower than DELTAREUSEALWAYS but allows more mechanisms to kick in,
          e.g. large file detection and handling.

        Delta computation can be slow, so the choice of delta reuse policy can
        significantly affect run time.

        The default policy (``DELTAREUSESAMEREVS``) strikes a balance between
        two extremes. Deltas will be reused if they are appropriate. But if the
        delta could choose a better revision, it will do so. This means if you
        are converting a non-generaldelta revlog to a generaldelta revlog,
        deltas will be recomputed if the delta's parent isn't a parent of the
        revision.

        In addition to the delta policy, the ``forcedeltabothparents``
        argument controls whether to force computing deltas against both
        parents for merges. If None, the destination revlog's current
        configuration is used.

        See `revlogutil.sidedata.get_sidedata_helpers` for the doc on
        `sidedata_helpers`.
        """
        if deltareuse not in self.DELTAREUSEALL:
            raise ValueError(
                _(b'value for deltareuse invalid: %s') % deltareuse
            )

        if len(destrevlog):
            raise ValueError(_(b'destination revlog is not empty'))

        if getattr(self, 'filteredrevs', None):
            raise ValueError(_(b'source revlog has filtered revisions'))
        if getattr(destrevlog, 'filteredrevs', None):
            raise ValueError(_(b'destination revlog has filtered revisions'))

        # lazy_delta and lazy_delta_base control whether to reuse a cached
        # delta, if possible.
        old_delta_config = destrevlog.delta_config
        destrevlog.delta_config = destrevlog.delta_config.copy()

        try:
            if deltareuse == self.DELTAREUSEALWAYS:
                destrevlog.delta_config.lazy_delta_base = True
                destrevlog.delta_config.lazy_delta = True
            elif deltareuse == self.DELTAREUSESAMEREVS:
                destrevlog.delta_config.lazy_delta_base = False
                destrevlog.delta_config.lazy_delta = True
            elif deltareuse == self.DELTAREUSENEVER:
                destrevlog.delta_config.lazy_delta_base = False
                destrevlog.delta_config.lazy_delta = False

            delta_both_parents = (
                forcedeltabothparents or old_delta_config.delta_both_parents
            )
            destrevlog.delta_config.delta_both_parents = delta_both_parents

            with self.reading():
                self._clone(
                    tr,
                    destrevlog,
                    addrevisioncb,
                    deltareuse,
                    forcedeltabothparents,
                    sidedata_helpers,
                )

        finally:
            destrevlog.delta_config = old_delta_config

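    # A sketch of a typical caller (hypothetical setup; real consumers live
    # in the upgrade and conversion machinery):
    #
    #     with repo.transaction(b'rewrite') as tr:
    #         src.clone(tr, dst, deltareuse=revlog.DELTAREUSESAMEREVS)
    #
    # The source is read under `self.reading()` while every revision is
    # re-added to the destination, so format options (compression,
    # generaldelta, ...) are taken from the destination's configuration.
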
    def _clone(
        self,
        tr,
        destrevlog,
        addrevisioncb,
        deltareuse,
        forcedeltabothparents,
        sidedata_helpers,
    ):
        """perform the core duty of `revlog.clone` after parameter processing"""
        write_debug = None
        if self.delta_config.debug_delta:
            write_debug = tr._report
        deltacomputer = deltautil.deltacomputer(
            destrevlog,
            write_debug=write_debug,
        )
        index = self.index
        for rev in self:
            entry = index[rev]

            # Some classes override linkrev to take filtered revs into
            # account. Use raw entry from index.
            flags = entry[0] & 0xFFFF
            linkrev = entry[4]
            p1 = index[entry[5]][7]
            p2 = index[entry[6]][7]
            node = entry[7]

            # (Possibly) reuse the delta from the revlog if allowed and
            # the revlog chunk is a delta.
            cachedelta = None
            rawtext = None
            if deltareuse == self.DELTAREUSEFULLADD:
                text = self._revisiondata(rev)
                sidedata = self.sidedata(rev)

                if sidedata_helpers is not None:
                    (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                        self, sidedata_helpers, sidedata, rev
                    )
                    flags = flags | new_flags[0] & ~new_flags[1]

                destrevlog.addrevision(
                    text,
                    tr,
                    linkrev,
                    p1,
                    p2,
                    cachedelta=cachedelta,
                    node=node,
                    flags=flags,
                    deltacomputer=deltacomputer,
                    sidedata=sidedata,
                )
            else:
                if destrevlog.delta_config.lazy_delta:
                    dp = self.deltaparent(rev)
                    if dp != nullrev:
                        cachedelta = (dp, bytes(self._chunk(rev)))

                sidedata = None
                if not cachedelta:
                    try:
                        rawtext = self._revisiondata(rev)
                    except error.CensoredNodeError as censored:
                        assert flags & REVIDX_ISCENSORED
                        rawtext = censored.tombstone
                    sidedata = self.sidedata(rev)
                if sidedata is None:
                    sidedata = self.sidedata(rev)

                if sidedata_helpers is not None:
                    (sidedata, new_flags) = sidedatautil.run_sidedata_helpers(
                        self, sidedata_helpers, sidedata, rev
                    )
                    flags = flags | new_flags[0] & ~new_flags[1]

                with destrevlog._writing(tr):
                    destrevlog._addrevision(
                        node,
                        rawtext,
                        tr,
                        linkrev,
                        p1,
                        p2,
                        flags,
                        cachedelta,
                        deltacomputer=deltacomputer,
                        sidedata=sidedata,
                    )

            if addrevisioncb:
                addrevisioncb(self, rev, node)

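    # The try/except around _revisiondata() in the non-fulladd branch above
    # lets _clone() carry a censored revision over instead of aborting:
    # reading such a revision raises CensoredNodeError, and the stored
    # tombstone is re-added verbatim while the (asserted) REVIDX_ISCENSORED
    # flag travels with it, so the destination ends up censored in exactly
    # the same way. Equivalent standalone sketch:
    #
    #     try:
    #         rawtext = src._revisiondata(rev)
    #     except error.CensoredNodeError as censored:
    #         rawtext = censored.tombstone  # keep the censor marker as-is
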
    def censorrevision(self, tr, censornode, tombstone=b''):
        if self._format_version == REVLOGV0:
            raise error.RevlogError(
                _(b'cannot censor with version %d revlogs')
                % self._format_version
            )
        elif self._format_version == REVLOGV1:
            rewrite.v1_censor(self, tr, censornode, tombstone)
        else:
            rewrite.v2_censor(self, tr, censornode, tombstone)

    def verifyintegrity(self, state):
        """Verifies the integrity of the revlog.

        Yields ``revlogproblem`` instances describing problems that are
        found.
        """
        dd, di = self.checksize()
        if dd:
            yield revlogproblem(error=_(b'data length off by %d bytes') % dd)
        if di:
            yield revlogproblem(error=_(b'index contains %d extra bytes') % di)

        version = self._format_version

        # The verifier tells us what version revlog we should be.
        if version != state[b'expectedversion']:
            yield revlogproblem(
                warning=_(b"warning: '%s' uses revlog format %d; expected %d")
                % (self.display_id, version, state[b'expectedversion'])
            )

        state[b'skipread'] = set()
        state[b'safe_renamed'] = set()

        for rev in self:
            node = self.node(rev)

            # Verify contents. 4 cases to care about:
            #
            #   common: the most common case
            #   rename: with a rename
            #   meta: file content starts with b'\1\n', the metadata
            #         header defined in filelog.py, but without a rename
            #   ext: content stored externally
            #
            # More formally, their differences are shown below:
            #
            #                       | common | rename | meta  | ext
            #  -------------------------------------------------------
            #  flags()              | 0      | 0      | 0     | not 0
            #  renamed()            | False  | True   | False | ?
            #  rawtext[0:2]=='\1\n' | False  | True   | True  | ?
            #
            # "rawtext" means the raw text stored in revlog data, which
            # could be retrieved by "rawdata(rev)". "text"
            # mentioned below is "revision(rev)".
            #
            # There are 3 different lengths stored physically:
            #  1. L1: rawsize, stored in revlog index
            #  2. L2: len(rawtext), stored in revlog data
            #  3. L3: len(text), stored in revlog data if flags==0, or
            #     possibly somewhere else if flags!=0
            #
            # L1 should be equal to L2. L3 could be different from them.
            # "text" may or may not affect commit hash depending on flag
            # processors (see flagutil.addflagprocessor).
            #
            #              | common | rename | meta  | ext
            # -------------------------------------------------
            # rawsize()    | L1     | L1     | L1    | L1
            # size()       | L1     | L2-LM  | L1(*) | L1 (?)
            # len(rawtext) | L2     | L2     | L2    | L2
            # len(text)    | L2     | L2     | L2    | L3
            # len(read())  | L2     | L2-LM  | L2-LM | L3 (?)
            #
            # LM:  length of metadata, depending on rawtext
            # (*): not ideal, see comment in filelog.size
            # (?): could be "- len(meta)" if the resolved content has
            #      rename metadata
            #
            # Checks needed to be done:
            # 1. length check: L1 == L2, in all cases.
            # 2. hash check: depending on flag processor, we may need to
            #    use either "text" (external), or "rawtext" (in revlog).

3654 try:
3658 try:
3655 skipflags = state.get(b'skipflags', 0)
3659 skipflags = state.get(b'skipflags', 0)
3656 if skipflags:
3660 if skipflags:
3657 skipflags &= self.flags(rev)
3661 skipflags &= self.flags(rev)
3658
3662
3659 _verify_revision(self, skipflags, state, node)
3663 _verify_revision(self, skipflags, state, node)
3660
3664
3661 l1 = self.rawsize(rev)
3665 l1 = self.rawsize(rev)
3662 l2 = len(self.rawdata(node))
3666 l2 = len(self.rawdata(node))
3663
3667
3664 if l1 != l2:
3668 if l1 != l2:
3665 yield revlogproblem(
3669 yield revlogproblem(
3666 error=_(b'unpacked size is %d, %d expected') % (l2, l1),
3670 error=_(b'unpacked size is %d, %d expected') % (l2, l1),
3667 node=node,
3671 node=node,
3668 )
3672 )
3669
3673
3670 except error.CensoredNodeError:
3674 except error.CensoredNodeError:
3671 if state[b'erroroncensored']:
3675 if state[b'erroroncensored']:
3672 yield revlogproblem(
3676 yield revlogproblem(
3673 error=_(b'censored file data'), node=node
3677 error=_(b'censored file data'), node=node
3674 )
3678 )
3675 state[b'skipread'].add(node)
3679 state[b'skipread'].add(node)
3676 except Exception as e:
3680 except Exception as e:
3677 yield revlogproblem(
3681 yield revlogproblem(
3678 error=_(b'unpacking %s: %s')
3682 error=_(b'unpacking %s: %s')
3679 % (short(node), stringutil.forcebytestr(e)),
3683 % (short(node), stringutil.forcebytestr(e)),
3680 node=node,
3684 node=node,
3681 )
3685 )
3682 state[b'skipread'].add(node)
3686 state[b'skipread'].add(node)
3683
3687
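As an aside, to make the LM bookkeeping above concrete, here is a minimal sketch of splitting a filelog-style metadata header off a rawtext. This is illustrative only, not part of this change; the helper name `unpack_meta` is invented, and the framing assumed is the b'\1\n' marker convention described in the comment above.

    # Illustrative only: mirrors the b'\1\n' framing discussed above.
    def unpack_meta(rawtext):
        if rawtext[:2] != b'\x01\n':
            return {}, rawtext                 # common case: no header, LM == 0
        end = rawtext.index(b'\x01\n', 2)      # locate the closing marker
        lines = rawtext[2:end].split(b'\n')
        meta = dict(l.split(b': ', 1) for l in lines if l)
        return meta, rawtext[end + 2:]         # len(text) == len(rawtext) - LM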
    def storageinfo(
        self,
        exclusivefiles=False,
        sharedfiles=False,
        revisionscount=False,
        trackedsize=False,
        storedsize=False,
    ):
        d = {}

        if exclusivefiles:
            d[b'exclusivefiles'] = [(self.opener, self._indexfile)]
            if not self._inline:
                d[b'exclusivefiles'].append((self.opener, self._datafile))

        if sharedfiles:
            d[b'sharedfiles'] = []

        if revisionscount:
            d[b'revisionscount'] = len(self)

        if trackedsize:
            d[b'trackedsize'] = sum(map(self.rawsize, iter(self)))

        if storedsize:
            d[b'storedsize'] = sum(
                self.opener.stat(path).st_size for path in self.files()
            )

        return d
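A brief, hypothetical usage note: each figure is computed only when its keyword is requested, so callers pay only for what they ask for. In the sketch below, `rl` is an assumed stand-in for any revlog-like object exposing this method.

    # Only the requested keys appear in the result dictionary.
    info = rl.storageinfo(revisionscount=True, trackedsize=True)
    print(info[b'revisionscount'], info[b'trackedsize'])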
    def rewrite_sidedata(self, transaction, helpers, startrev, endrev):
        if not self.feature_config.has_side_data:
            return
        # revlog formats with sidedata support do not support inline data
        assert not self._inline
        if not helpers[1] and not helpers[2]:
            # Nothing to generate or remove
            return

        new_entries = []
        # append the new sidedata
        with self._writing(transaction):
            ifh, dfh, sdfh = self._writinghandles
            dfh.seek(self._docket.sidedata_end, os.SEEK_SET)

            current_offset = sdfh.tell()
            for rev in range(startrev, endrev + 1):
                entry = self.index[rev]
                new_sidedata, flags = sidedatautil.run_sidedata_helpers(
                    store=self,
                    sidedata_helpers=helpers,
                    sidedata={},
                    rev=rev,
                )

                serialized_sidedata = sidedatautil.serialize_sidedata(
                    new_sidedata
                )

                sidedata_compression_mode = COMP_MODE_INLINE
                if serialized_sidedata and self.feature_config.has_side_data:
                    sidedata_compression_mode = COMP_MODE_PLAIN
                    h, comp_sidedata = self.compress(serialized_sidedata)
                    if (
                        h != b'u'
                        and comp_sidedata[0] != b'\0'
                        and len(comp_sidedata) < len(serialized_sidedata)
                    ):
                        assert not h
                        if (
                            comp_sidedata[0]
                            == self._docket.default_compression_header
                        ):
                            sidedata_compression_mode = COMP_MODE_DEFAULT
                            serialized_sidedata = comp_sidedata
                        else:
                            sidedata_compression_mode = COMP_MODE_INLINE
                            serialized_sidedata = comp_sidedata
                if entry[8] != 0 or entry[9] != 0:
                    # rewriting entries that already have sidedata is not
                    # supported yet, because it introduces garbage data in the
                    # revlog.
                    msg = b"rewriting existing sidedata is not supported yet"
                    raise error.Abort(msg)

                # Apply (potential) flags to add and to remove after running
                # the sidedata helpers
                new_offset_flags = entry[0] | flags[0] & ~flags[1]
                entry_update = (
                    current_offset,
                    len(serialized_sidedata),
                    new_offset_flags,
                    sidedata_compression_mode,
                )

                # the sidedata computation might have moved the file cursors
                # around
                sdfh.seek(current_offset, os.SEEK_SET)
                sdfh.write(serialized_sidedata)
                new_entries.append(entry_update)
                current_offset += len(serialized_sidedata)
            self._docket.sidedata_end = sdfh.tell()

            # rewrite the new index entries
            ifh.seek(startrev * self.index.entry_size)
            for i, e in enumerate(new_entries):
                rev = startrev + i
                self.index.replace_sidedata_info(rev, *e)
                packed = self.index.entry_binary(rev)
                if rev == 0 and self._docket is None:
                    header = self._format_flags | self._format_version
                    header = self.index.pack_header(header)
                    packed = header + packed
                ifh.write(packed)
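The compression-mode selection above can be summarized by the following standalone sketch. This is an illustration under stated assumptions, not the revlog implementation: zlib stands in for the configured compression engine dispatched through self.compress(), the mode names are plain strings rather than the COMP_MODE_* constants, and the b'x' default header is only the usual first byte of zlib output.

    import zlib

    def pick_sidedata_mode(raw, default_header=b'x'):
        """Illustrative: choose how a serialized sidedata blob is stored."""
        comp = zlib.compress(raw)
        if len(comp) >= len(raw):
            return 'plain', raw       # compression does not pay off
        if comp[:1] == default_header:
            return 'default', comp    # engine implied by the docket default
        return 'inline', comp         # engine identified by its inline header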
@@ -1,611 +1,603 @@
#require no-reposimplestore
#testcases revlogv1 revlogv2

#if revlogv2

  $ cat >> $HGRCPATH <<EOF
  > [experimental]
  > revlogv2=enable-unstable-format-and-corrupt-my-data
  > EOF

#endif

  $ cp $HGRCPATH $HGRCPATH.orig

Create repo with unimpeachable content

  $ hg init r
  $ cd r
  $ echo 'Initially untainted file' > target
  $ echo 'Normal file here' > bystander
  $ hg add target bystander
  $ hg ci -m init

Clone repo so we can test pull later

  $ cd ..
  $ hg clone r rpull
  updating to branch default
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cd r

Introduce content which will ultimately require censorship. Name the first
censored node C1, second C2, and so on

  $ echo 'Tainted file' > target
  $ echo 'Passwords: hunter2' >> target
  $ hg ci -m taint target
  $ C1=`hg id --debug -i`

  $ echo 'hunter3' >> target
  $ echo 'Normal file v2' > bystander
  $ hg ci -m moretaint target bystander
  $ C2=`hg id --debug -i`

Add new sanitized versions to correct our mistake. Name the first head H1,
the second head H2, and so on

  $ echo 'Tainted file is now sanitized' > target
  $ hg ci -m sanitized target
  $ H1=`hg id --debug -i`

  $ hg update -r $C2
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ echo 'Tainted file now super sanitized' > target
  $ hg ci -m 'super sanitized' target
  created new head
  $ H2=`hg id --debug -i`

Verify target contents before censorship at each revision

  $ hg cat -r $H1 target | head -n 10
  Tainted file is now sanitized
  $ hg cat -r $H2 target | head -n 10
  Tainted file now super sanitized
  $ hg cat -r $C2 target | head -n 10
  Tainted file
  Passwords: hunter2
  hunter3
  $ hg cat -r $C1 target | head -n 10
  Tainted file
  Passwords: hunter2
  $ hg cat -r 0 target | head -n 10
  Initially untainted file

Censor revision with 2 offenses

(this also tests file pattern matching: path relative to cwd case)

  $ mkdir -p foo/bar/baz
  $ hg --config extensions.censor= --cwd foo/bar/baz censor -r $C2 -t "remove password" ../../../target
  $ hg cat -r $H1 target | head -n 10
  Tainted file is now sanitized
  $ hg cat -r $H2 target | head -n 10
  Tainted file now super sanitized
  $ hg cat -r $C2 target | head -n 10
  abort: censored node: 1e0247a9a4b7
  (set censor.policy to ignore errors)
  $ hg cat -r $C1 target | head -n 10
  Tainted file
  Passwords: hunter2
  $ hg cat -r 0 target | head -n 10
  Initially untainted file

Censor revision with 1 offense

(this also tests file pattern matching: with 'path:' scheme)

  $ hg --config extensions.censor= --cwd foo/bar/baz censor -r $C1 path:target
  $ hg cat -r $H1 target | head -n 10
  Tainted file is now sanitized
  $ hg cat -r $H2 target | head -n 10
  Tainted file now super sanitized
  $ hg cat -r $C2 target | head -n 10
  abort: censored node: 1e0247a9a4b7
  (set censor.policy to ignore errors)
  $ hg cat -r $C1 target | head -n 10
  abort: censored node: 613bc869fceb
  (set censor.policy to ignore errors)
  $ hg cat -r 0 target | head -n 10
  Initially untainted file

Can only check out target at uncensored revisions; -X is a workaround for --all

  $ hg revert -r $C2 target | head -n 10
  abort: censored node: 1e0247a9a4b7
  (set censor.policy to ignore errors)
  $ hg revert -r $C1 target | head -n 10
  abort: censored node: 613bc869fceb
  (set censor.policy to ignore errors)
  $ hg revert -r $C1 --all
  reverting bystander
  reverting target
  abort: censored node: 613bc869fceb
  (set censor.policy to ignore errors)
  [255]
  $ hg revert -r $C1 --all -X target
  $ cat target | head -n 10
  Tainted file now super sanitized
  $ hg revert -r 0 --all
  reverting target
  $ cat target | head -n 10
  Initially untainted file
  $ hg revert -r $H2 --all
  reverting bystander
  reverting target
  $ cat target | head -n 10
  Tainted file now super sanitized

Uncensored file can be viewed at any revision

  $ hg cat -r $H1 bystander | head -n 10
  Normal file v2
  $ hg cat -r $C2 bystander | head -n 10
  Normal file v2
  $ hg cat -r $C1 bystander | head -n 10
  Normal file here
  $ hg cat -r 0 bystander | head -n 10
  Normal file here

Can update to children of censored revision

  $ hg update -r $H1
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Tainted file is now sanitized
  $ hg update -r $H2
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Tainted file now super sanitized

Set censor policy to abort in trusted $HGRC so hg verify fails

  $ cp $HGRCPATH.orig $HGRCPATH
  $ cat >> $HGRCPATH <<EOF
  > [censor]
  > policy = abort
  > EOF

Repo fails verification due to censorship

  $ hg verify
  checking changesets
  checking manifests
  crosschecking files in changesets and manifests
  checking files
  target@1: censored file data
  target@2: censored file data
  not checking dirstate because of previous errors
  checked 5 changesets with 7 changes to 2 files
  2 integrity errors encountered!
  (first damaged changeset appears to be 1)
  [1]

Cannot update to revision with censored data

  $ hg update -r $C2
  abort: censored node: 1e0247a9a4b7
  (set censor.policy to ignore errors)
  [255]
  $ hg update -r $C1
  abort: censored node: 613bc869fceb
  (set censor.policy to ignore errors)
  [255]
  $ hg update -r 0
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg update -r $H2
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved

Set censor policy to ignore in trusted $HGRC so hg verify passes

  $ cp $HGRCPATH.orig $HGRCPATH
  $ cat >> $HGRCPATH <<EOF
  > [censor]
  > policy = ignore
  > EOF

Repo passes verification with warnings with explicit config

  $ hg verify -q

May update to revision with censored data with explicit config

  $ hg update -r $C2
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  $ hg update -r $C1
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  $ hg update -r 0
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Initially untainted file
  $ hg update -r $H2
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Tainted file now super sanitized

Can merge in revision with censored data. Test requires one branch of history
with the file censored, but we can't censor at a head, so advance H1.

  $ hg update -r $H1
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ C3=$H1
  $ echo 'advanced head H1' > target
  $ hg ci -m 'advance head H1' target
  $ H1=`hg id --debug -i`
  $ hg --config extensions.censor= censor -r $C3 target
  $ hg update -r $H2
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg merge -r $C3
  merging target
  0 files updated, 1 files merged, 0 files removed, 0 files unresolved
  (branch merge, don't forget to commit)

Revisions present in repository heads may not be censored

  $ hg update -C -r $H2
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg --config extensions.censor= censor -r $H2 target
  abort: cannot censor file in heads (78a8fc215e79)
  (clean/delete and commit first)
  [255]
  $ echo 'twiddling thumbs' > bystander
  $ hg ci -m 'bystander commit'
  $ H2=`hg id --debug -i`
  $ hg --config extensions.censor= censor -r "$H2^" target
  abort: cannot censor file in heads (efbe78065929)
  (clean/delete and commit first)
  [255]

Cannot censor working directory

  $ echo 'seriously no passwords' > target
  $ hg ci -m 'extend second head arbitrarily' target
  $ H2=`hg id --debug -i`
  $ hg update -r "$H2^"
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ hg --config extensions.censor= censor -r . target
  abort: cannot censor working directory
  (clean/delete/update first)
  [255]
  $ hg update -r $H2
  1 files updated, 0 files merged, 0 files removed, 0 files unresolved

Can re-add file after being deleted + censored

  $ C4=$H2
  $ hg rm target
  $ hg ci -m 'delete target so it may be censored'
  $ H2=`hg id --debug -i`
  $ hg --config extensions.censor= censor -r $C4 target
  $ hg cat -r $C4 target | head -n 10
  $ hg cat -r "$H2^^" target | head -n 10
  Tainted file now super sanitized
  $ echo 'fresh start' > target
  $ hg add target
  $ hg ci -m reincarnated target
  $ H2=`hg id --debug -i`
  $ hg cat -r $H2 target | head -n 10
  fresh start
  $ hg cat -r "$H2^" target | head -n 10
  target: no such file in rev 452ec1762369
  $ hg cat -r $C4 target | head -n 10
  $ hg cat -r "$H2^^^" target | head -n 10
  Tainted file now super sanitized

Can censor after revlog has expanded to no longer permit inline storage

  $ for x in `"$PYTHON" $TESTDIR/seq.py 0 50000`
  > do
  > echo "Password: hunter$x" >> target
  > done
  $ hg ci -m 'add 100k passwords'
  $ H2=`hg id --debug -i`
  $ C5=$H2
  $ hg revert -r "$H2^" target
  $ hg ci -m 'cleaned 100k passwords'
  $ H2=`hg id --debug -i`
  $ hg --config extensions.censor= censor -r $C5 target
  $ hg cat -r $C5 target | head -n 10
  $ hg cat -r $H2 target | head -n 10
  fresh start

Repo with censored nodes can be cloned and cloned nodes are censored

  $ cd ..
  $ hg clone r rclone
  updating to branch default
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cd rclone
  $ hg cat -r $H1 target | head -n 10
  advanced head H1
  $ hg cat -r $H2~5 target | head -n 10
  Tainted file now super sanitized
  $ hg cat -r $C2 target | head -n 10
  $ hg cat -r $C1 target | head -n 10
  $ hg cat -r 0 target | head -n 10
  Initially untainted file
  $ hg verify -q

Repo cloned before tainted content introduced can pull censored nodes

  $ cd ../rpull
  $ hg cat -r tip target | head -n 10
  Initially untainted file
  $ hg verify -q
  $ hg pull -r $H1 -r $H2
  pulling from $TESTTMP/r
  searching for changes
  adding changesets
  adding manifests
  adding file changes
  added 11 changesets with 11 changes to 2 files (+1 heads)
  new changesets 186fb27560c3:683e4645fded
  (run 'hg heads' to see heads, 'hg merge' to merge)
  $ hg update 4
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Tainted file now super sanitized
  $ hg cat -r $H1 target | head -n 10
  advanced head H1
  $ hg cat -r $H2~5 target | head -n 10
  Tainted file now super sanitized
  $ hg cat -r $C2 target | head -n 10
  $ hg cat -r $C1 target | head -n 10
  $ hg cat -r 0 target | head -n 10
  Initially untainted file
  $ hg verify -q

Censored nodes can be pushed if they censor previously unexchanged nodes

  $ echo 'Passwords: hunter2hunter2' > target
  $ hg ci -m 're-add password from clone' target
  created new head
  $ H3=`hg id --debug -i`
  $ REV=$H3
  $ echo 'Re-sanitized; nothing to see here' > target
  $ hg ci -m 're-sanitized' target
  $ H2=`hg id --debug -i`
  $ CLEANREV=$H2
  $ hg cat -r $REV target | head -n 10
  Passwords: hunter2hunter2
  $ hg --config extensions.censor= censor -r $REV target
  $ hg cat -r $REV target | head -n 10
  $ hg cat -r $CLEANREV target | head -n 10
  Re-sanitized; nothing to see here
  $ hg push -f -r $H2
  pushing to $TESTTMP/r
  searching for changes
  adding changesets
  adding manifests
  adding file changes
  added 2 changesets with 2 changes to 1 files (+1 heads)

  $ cd ../r
  $ hg cat -r $REV target | head -n 10
  $ hg cat -r $CLEANREV target | head -n 10
  Re-sanitized; nothing to see here
  $ hg update $CLEANREV
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Re-sanitized; nothing to see here

Censored nodes can be bundled up and unbundled in another repo

  $ hg bundle --base 0 ../pwbundle
  13 changesets found
  $ cd ../rclone
  $ hg unbundle ../pwbundle
  adding changesets
  adding manifests
  adding file changes
  added 2 changesets with 2 changes to 2 files (+1 heads)
  new changesets 075be80ac777:dcbaf17bf3a1 (2 drafts)
  (run 'hg heads .' to see heads, 'hg merge' to merge)
  $ hg cat -r $REV target | head -n 10
  $ hg cat -r $CLEANREV target | head -n 10
  Re-sanitized; nothing to see here
  $ hg update $CLEANREV
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Re-sanitized; nothing to see here
  $ hg verify -q

Grepping only warns, doesn't error out

  $ cd ../rpull
  $ hg grep 'Normal file'
  bystander:Normal file v2
  $ hg grep nothing
  target:Re-sanitized; nothing to see here
  $ hg grep --diff 'Normal file'
  cannot search in censored file: target:7
  cannot search in censored file: target:10
  cannot search in censored file: target:12
  bystander:6:-:Normal file v2
  cannot search in censored file: target:1
  cannot search in censored file: target:2
  cannot search in censored file: target:3
  bystander:2:-:Normal file here
  bystander:2:+:Normal file v2
  bystander:0:+:Normal file here
  $ hg grep --diff nothing
  cannot search in censored file: target:7
  cannot search in censored file: target:10
  cannot search in censored file: target:12
  target:13:+:Re-sanitized; nothing to see here
  cannot search in censored file: target:1
  cannot search in censored file: target:2
  cannot search in censored file: target:3

Censored nodes can be imported on top of censored nodes, consecutively

  $ hg init ../rimport
  $ hg bundle --base 1 ../rimport/splitbundle
  12 changesets found
  $ cd ../rimport
  $ hg pull -r $H1 -r $H2 ../r
  pulling from ../r
  adding changesets
  adding manifests
  adding file changes
  added 8 changesets with 10 changes to 2 files (+1 heads)
  new changesets e97f55b2665a:dcbaf17bf3a1
  (run 'hg heads' to see heads, 'hg merge' to merge)
  $ hg unbundle splitbundle
  adding changesets
  adding manifests
  adding file changes
  added 6 changesets with 5 changes to 2 files (+1 heads)
  new changesets efbe78065929:683e4645fded (6 drafts)
  (run 'hg heads .' to see heads, 'hg merge' to merge)
  $ hg update $H2
  2 files updated, 0 files merged, 0 files removed, 0 files unresolved
  $ cat target | head -n 10
  Re-sanitized; nothing to see here
  $ hg verify -q
  $ cd ../r

Can import bundle where first revision of a file is censored

  $ hg init ../rinit
  $ hg --config extensions.censor= censor -r 0 target
  $ hg bundle -r 0 --base null ../rinit/initbundle
  1 changesets found
  $ cd ../rinit
  $ hg unbundle initbundle
  adding changesets
  adding manifests
  adding file changes
  added 1 changesets with 2 changes to 2 files
  new changesets e97f55b2665a (1 drafts)
  (run 'hg update' to get a working copy)
  $ hg cat -r 0 target | head -n 10

#if revlogv2

Testing feature that does not work in revlog v1
===============================================

Censoring a revision that is used as delta base
-----------------------------------------------

  $ cd ..
  $ hg init censor-with-delta
  $ cd censor-with-delta
  $ echo root > target
  $ hg add target
  $ hg commit -m root
  $ B0=`hg id --debug -i`
  $ for x in `"$PYTHON" $TESTDIR/seq.py 0 50000`
  > do
  > echo "Password: hunter$x" >> target
  > done
  $ hg ci -m 'write a long file'
  $ B1=`hg id --debug -i`
  $ echo 'small change (should create a delta)' >> target
  $ hg ci -m 'create a delta over the password'
(should show that the last revision is a delta, not a snapshot)
  $ B2=`hg id --debug -i`

Make sure the last revision is a delta against the revision we will censor

  $ hg debugdeltachain target -T '{rev} {chainid} {chainlen} {prevrev}\n'
  0 1 1 -1
  1 2 1 -1
  2 2 2 1

Censor the file

  $ hg cat -r $B1 target | wc -l
  *50002 (re)
  $ hg --config extensions.censor= censor -r $B1 target
  $ hg cat -r $B1 target | wc -l
  *0 (re)

Check that the child revision is fine

  $ hg cat -r $B2 target | wc -l
  *50003 (re)

#endif

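For readers following the debugdeltachain output above: each revision is stored either as a full snapshot or as a delta against a base revision, and censoring a revision that other deltas build on is exactly what requires the revlogv2-only handling. A hypothetical sketch of walking such a chain, assuming a revlog-like object `rl` (the function name is invented for illustration):

    from mercurial.node import nullrev

    def delta_chain(rl, rev):
        # Illustrative only: follow delta bases until a full snapshot,
        # the way `hg debugdeltachain` reports chains.
        chain = [rev]
        while rl.deltaparent(rev) != nullrev:
            rev = rl.deltaparent(rev)
            chain.append(rev)
        return chain[::-1]  # e.g. [1, 2] for rev 2 in the output above
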
Testing repository upgrade with censored revisions
==================================================

  $ cd ../rclone

With the "abort" policy
=======================

  $ hg verify --config censor.policy=ignore
  checking changesets
  checking manifests
  crosschecking files in changesets and manifests
  checking files
  checking dirstate
  checked 14 changesets with 15 changes to 2 files
  $ hg debugupgraderepo --run --quiet \
  > --optimize re-delta-parent \
  > --config censor.policy=abort
  upgrade will perform the following actions:

  requirements
     preserved: * (glob)

  optimisations: re-delta-parent

  processed revlogs:
    - all-filelogs
    - changelog
    - manifest

-  transaction abort!
-  rollback completed
-  abort: file censored target:613bc869fceb
-  [255]
  $ hg verify --config censor.policy=ignore
  checking changesets
  checking manifests
  crosschecking files in changesets and manifests
  checking files
  checking dirstate
  checked 14 changesets with 15 changes to 2 files

With the "ignore" policy
========================

  $ hg verify --config censor.policy=ignore
  checking changesets
  checking manifests
  crosschecking files in changesets and manifests
  checking files
  checking dirstate
  checked 14 changesets with 15 changes to 2 files
  $ hg debugupgraderepo --run --quiet \
  > --optimize re-delta-parent \
  > --config censor.policy=ignore
  upgrade will perform the following actions:

  requirements
     preserved: * (glob)

  optimisations: re-delta-parent

  processed revlogs:
    - all-filelogs
    - changelog
    - manifest

-  transaction abort!
-  rollback completed
-  abort: file censored target:613bc869fceb
-  [255]
  $ hg verify --config censor.policy=ignore
  checking changesets
  checking manifests
  crosschecking files in changesets and manifests
  checking files
  checking dirstate
  checked 14 changesets with 15 changes to 2 files