revlog: change generaldelta delta parent heuristic...
Durham Goode
r26117:4dc5b51f default
@@ -1,1626 +1,1629
# revlog.py - storage back-end for mercurial
#
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""

# import stuff from node for others to import from revlog
import collections
from node import bin, hex, nullid, nullrev
from i18n import _
import ancestor, mdiff, parsers, error, util, templatefilters
import struct, zlib, errno

_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog header flags
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOGGENERALDELTA = (1 << 17)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGGENERALDELTA

# revlog index flags
REVIDX_ISCENSORED = (1 << 15) # revision has censor metadata, must be verified
REVIDX_DEFAULT_FLAGS = 0
REVIDX_KNOWN_FLAGS = REVIDX_ISCENSORED

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

RevlogError = error.RevlogError
LookupError = error.LookupError
CensoredNodeError = error.CensoredNodeError

def getoffset(q):
    return int(q >> 16)

def gettype(q):
    return int(q & 0xFFFF)

def offset_type(offset, type):
    return long(long(offset) << 16 | type)
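
# Illustration (not part of the original file): the low 16 bits of the packed
# value carry the entry type/flags and the remaining bits carry the offset,
# so the three helpers above round-trip. Values below are made up for the
# sketch.
#
#   >>> q = offset_type(10, 1)
#   >>> getoffset(q), gettype(q)
#   (10, 1)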

_nullhash = _sha(nullid)

def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    # As of now, if one of the parent nodes is null, p2 is null
    if p2 == nullid:
        # deep copy of a hash is faster than creating one
        s = _nullhash.copy()
        s.update(p1)
    else:
        # none of the parent nodes are nullid
        l = [p1, p2]
        l.sort()
        s = _sha(l[0])
        s.update(l[1])
    s.update(text)
    return s.digest()
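
# Doctest-style sketch (not part of the original file): when p2 is nullid the
# node hash reduces to sha1 over nullid + p1 + text, since nullid (20 zero
# bytes) always sorts first. p1 below is an arbitrary made-up parent id.
#
#   >>> import hashlib
#   >>> p1 = '\x11' * 20
#   >>> hash('data', p1, nullid) == hashlib.sha1(nullid + p1 + 'data').digest()
#   True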

def decompress(bin):
    """ decompress the given input """
    if not bin:
        return bin
    t = bin[0]
    if t == '\0':
        return bin
    if t == 'x':
        try:
            return _decompress(bin)
        except zlib.error as e:
            raise RevlogError(_("revlog decompress error: %s") % str(e))
    if t == 'u':
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)
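
# Illustration (not part of the original file) of the three chunk markers:
# '\0' chunks are returned verbatim, 'x' marks zlib data (zlib output begins
# with 0x78, i.e. 'x'), and 'u' prefixes text stored uncompressed.
#
#   >>> import zlib
#   >>> decompress('uhello')
#   'hello'
#   >>> decompress(zlib.compress('hello'))
#   'hello'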

# index v0:
#  4 bytes: offset
#  4 bytes: compressed length
#  4 bytes: base rev
#  4 bytes: link rev
# 20 bytes: parent 1 nodeid
# 20 bytes: parent 2 nodeid
# 20 bytes: nodeid
indexformatv0 = ">4l20s20s20s"
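
# Sketch (not part of the original file): a v0 record is four 4-byte ints
# plus three 20-byte nodeids, 76 bytes per entry.
#
#   >>> import struct
#   >>> struct.calcsize(">4l20s20s20s")
#   76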

class revlogoldio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, data, inline):
        s = self.size
        index = []
        nodemap = {nullid: nullrev}
        n = off = 0
        l = len(data)
        while off + s <= l:
            cur = data[off:off + s]
            off += s
            e = _unpack(indexformatv0, cur)
            # transform to revlogv1 format
            e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                  nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
            index.append(e2)
            nodemap[e[6]] = n
            n += 1

        # add the magic null revision at -1
        index.append((0, 0, 0, -1, -1, -1, -1, nullid))

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        if gettype(entry[0]):
            raise RevlogError(_("index entry flags need RevlogNG"))
        e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
              node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *e2)

# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
versionformat = ">I"
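
# Sketch (not part of the original file): in the ng format the offset and
# flags share the leading unsigned quad, six 4-byte ints follow, and the
# 20-byte nodeid is zero-padded to 32 bytes, giving 64 bytes per entry;
# packentry (below) overwrites the first 4 bytes of entry 0 with the
# version header.
#
#   >>> import struct
#   >>> struct.calcsize(">Qiiiiii20s12x")
#   64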

# corresponds to uncompressed length of indexformatng (2 gigs, 4-byte
# signed integer)
_maxentrysize = 0x7fffffff

class revlogio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, data, inline):
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, getattr(index, 'nodemap', None), cache

    def packentry(self, entry, node, version, rev):
        p = _pack(indexformatng, *entry)
        if rev == 0:
            p = _pack(versionformat, version) + p[4:]
        return p

class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.
    """
    def __init__(self, opener, indexfile):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener
        self._cache = None
        self._basecache = None
        self._chunkcache = (0, '')
        self._chunkcachesize = 65536
        self._maxchainlen = None
        self.index = []
        self._pcache = {}
        self._nodecache = {nullid: nullrev}
        self._nodepos = None

        v = REVLOG_DEFAULT_VERSION
        opts = getattr(opener, 'options', None)
        if opts is not None:
            if 'revlogv1' in opts:
                if 'generaldelta' in opts:
                    v |= REVLOGGENERALDELTA
            else:
                v = 0
            if 'chunkcachesize' in opts:
                self._chunkcachesize = opts['chunkcachesize']
            if 'maxchainlen' in opts:
                self._maxchainlen = opts['maxchainlen']

        if self._chunkcachesize <= 0:
            raise RevlogError(_('revlog chunk cache size %r is not greater '
                                'than 0') % self._chunkcachesize)
        elif self._chunkcachesize & (self._chunkcachesize - 1):
            raise RevlogError(_('revlog chunk cache size %r is not a power '
                                'of 2') % self._chunkcachesize)
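        # Aside (not part of the original file): x & (x - 1) clears the
        # lowest set bit, so it is zero exactly when x is a power of two,
        # e.g. 65536 & 65535 == 0 while 65537 & 65536 != 0.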

        i = ''
        self._initempty = True
        try:
            f = self.opener(self.indexfile)
            i = f.read()
            f.close()
            if len(i) > 0:
                v = struct.unpack(versionformat, i[:4])[0]
                self._initempty = False
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise

        self.version = v
        self._inline = v & REVLOGNGINLINEDATA
        self._generaldelta = v & REVLOGGENERALDELTA
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        if fmt == REVLOGV0 and flags:
            raise RevlogError(_("index %s unknown flags %#04x for format v0")
                              % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
            raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                              % (self.indexfile, flags >> 16))
        elif fmt > REVLOGNG:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))

        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        try:
            d = self._io.parseindex(i, self._inline)
        except (ValueError, IndexError):
            raise RevlogError(_("index %s is corrupted") % (self.indexfile))
        self.index, nodemap, self._chunkcache = d
        if nodemap is not None:
            self.nodemap = self._nodecache = nodemap
        if not self._chunkcache:
            self._chunkclear()
        # revnum -> (chain-length, sum-delta-length)
        self._chaininfocache = {}

    def tip(self):
        return self.node(len(self.index) - 2)
    def __contains__(self, rev):
        return 0 <= rev < len(self)
    def __len__(self):
        return len(self.index) - 1
    def __iter__(self):
        return iter(xrange(len(self)))
    def revs(self, start=0, stop=None):
        """iterate over all revs in this revlog (from start to stop)"""
        step = 1
        if stop is not None:
            if start > stop:
                step = -1
            stop += step
        else:
            stop = len(self)
        return xrange(start, stop, step)
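    # Sketch (not part of the original file): stop is inclusive and the
    # range may run backwards. For a hypothetical revlog rl with three
    # revisions:
    #
    #   >>> list(rl.revs(0, 2))
    #   [0, 1, 2]
    #   >>> list(rl.revs(2, 0))
    #   [2, 1, 0]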

    @util.propertycache
    def nodemap(self):
        self.rev(self.node(0))
        return self._nodecache

    def hasnode(self, node):
        try:
            self.rev(node)
            return True
        except KeyError:
            return False

    def clearcaches(self):
        try:
            self._nodecache.clearcaches()
        except AttributeError:
            self._nodecache = {nullid: nullrev}
            self._nodepos = None

    def rev(self, node):
        try:
            return self._nodecache[node]
        except TypeError:
            raise
        except RevlogError:
            # parsers.c radix tree lookup failed
            raise LookupError(node, self.indexfile, _('no node'))
        except KeyError:
            # pure python cache lookup failed
            n = self._nodecache
            i = self.index
            p = self._nodepos
            if p is None:
                p = len(i) - 2
            for r in xrange(p, -1, -1):
                v = i[r][7]
                n[v] = r
                if v == node:
                    self._nodepos = r - 1
                    return r
            raise LookupError(node, self.indexfile, _('no node'))

    def node(self, rev):
        return self.index[rev][7]
    def linkrev(self, rev):
        return self.index[rev][4]
    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
    def parentrevs(self, rev):
        return self.index[rev][5:7]
    def start(self, rev):
        return int(self.index[rev][0] >> 16)
    def end(self, rev):
        return self.start(rev) + self.length(rev)
    def length(self, rev):
        return self.index[rev][1]
    def chainbase(self, rev):
        index = self.index
        base = index[rev][3]
        while base != rev:
            rev = base
            base = index[rev][3]
        return base
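    # Illustration (not part of the original file): chainbase follows the
    # base-rev field (index[rev][3]) until it reaches a self-referencing
    # entry. With a made-up index where index[5][3] == 3 and
    # index[3][3] == 3, chainbase(5) walks 5 -> 3 and returns 3.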
    def chainlen(self, rev):
        return self._chaininfo(rev)[0]

    def _chaininfo(self, rev):
        chaininfocache = self._chaininfocache
        if rev in chaininfocache:
            return chaininfocache[rev]
        index = self.index
        generaldelta = self._generaldelta
        iterrev = rev
        e = index[iterrev]
        clen = 0
        compresseddeltalen = 0
        while iterrev != e[3]:
            clen += 1
            compresseddeltalen += e[1]
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            if iterrev in chaininfocache:
                t = chaininfocache[iterrev]
                clen += t[0]
                compresseddeltalen += t[1]
                break
            e = index[iterrev]
        else:
            # Add text length of base since decompressing that also takes
            # work. For cache hits the length is already included.
            compresseddeltalen += e[1]
        r = (clen, compresseddeltalen)
        chaininfocache[rev] = r
        return r
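    # Illustration (not part of the original file): _chaininfo returns
    # (chain length, compressed bytes needed to reconstruct rev). For a
    # hypothetical generaldelta chain 10 -> 7 -> 4, where 4 is its own
    # base, the result is (2, length(10) + length(7) + length(4)).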

    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF
    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.revision(self.node(rev))
        return len(t)
    size = rawsize

    def ancestors(self, revs, stoprev=0, inclusive=False):
        """Generate the ancestors of 'revs' in reverse topological order.
        Does not generate revs lower than stoprev.

        See the documentation for ancestor.lazyancestors for more details."""

        return ancestor.lazyancestors(self.parentrevs, revs, stoprev=stoprev,
                                      inclusive=inclusive)

    def descendants(self, revs):
        """Generate the descendants of 'revs' in revision order.

        Yield a sequence of revision numbers starting with a child of
        some rev in revs, i.e., each revision is *not* considered a
        descendant of itself. Results are ordered by revision number (a
        topological sort)."""
        first = min(revs)
        if first == nullrev:
            for i in self:
                yield i
            return

        seen = set(revs)
        for i in self.revs(start=first + 1):
            for x in self.parentrevs(i):
                if x != nullrev and x in seen:
                    seen.add(i)
                    yield i
                    break

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common. In revset terminology, we return the
        tuple:

          ::common, (::heads) - (::common)

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        class lazyset(object):
            def __init__(self, lazyvalues):
                self.addedvalues = set()
                self.lazyvalues = lazyvalues

            def __contains__(self, value):
                return value in self.addedvalues or value in self.lazyvalues

            def __iter__(self):
                added = self.addedvalues
                for r in added:
                    yield r
                for r in self.lazyvalues:
                    if r not in added:
                        yield r

            def add(self, value):
                self.addedvalues.add(value)

            def update(self, values):
                self.addedvalues.update(values)

        has = lazyset(self.ancestors(common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = collections.deque(r for r in heads if r not in has)
        while visit:
            r = visit.popleft()
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(r) for r in missing]

    def incrementalmissingrevs(self, common=None):
        """Return an object that can be used to incrementally compute the
        revision numbers of the ancestors of arbitrary sets that are not
        ancestors of common. This is an ancestor.incrementalmissingancestors
        object.

        'common' is a list of revision numbers. If common is not supplied, uses
        nullrev.
        """
        if common is None:
            common = [nullrev]

        return ancestor.incrementalmissingancestors(self.parentrevs, common)

    def findmissingrevs(self, common=None, heads=None):
        """Return the revision numbers of the ancestors of heads that
        are not ancestors of common.

        More specifically, return a list of revision numbers corresponding to
        nodes N such that every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of revision numbers. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullrev]
        if heads is None:
            heads = self.headrevs()

        inc = self.incrementalmissingrevs(common=common)
        return inc.missingancestors(heads)

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        inc = self.incrementalmissingrevs(common=common)
        return [self.node(r) for r in inc.missingancestors(heads)]

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n) # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev: # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents is a
                # descendant. (We seeded the dependents list with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n, flag in heads.iteritems() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def headrevs(self):
        try:
            return self.index.headrevs()
        except AttributeError:
            return self._headrevs()

    def computephases(self, roots):
        return self.index.computephasesmapsets(roots)

    def _headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        # we won't iter over filtered revs so nobody is a head at start
        ishead = [0] * (count + 1)
        index = self.index
        for r in self:
            ishead[r] = 1 # I may be a head
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0 # my parents are not
        return [r for r, val in enumerate(ishead) if val]
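    # Sketch (not part of the original file): every rev starts out as a
    # candidate head and is cleared as soon as it appears as a parent, so
    # a hypothetical linear history 0-1-2 leaves only [2].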

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = set([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = set((startrev,))
        heads = set((startrev,))

        parentrevs = self.parentrevs
        for r in self.revs(start=startrev + 1):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable.add(r)
                        heads.add(r)
                    if p in heads and p not in stoprevs:
                        heads.remove(p)

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in self.revs(start=p + 1):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def descendant(self, start, end):
        if start == nullrev:
            return True
        for i in self.descendants([start]):
            if i == end:
                return True
            elif i > end:
                break
        return False

    def commonancestorsheads(self, a, b):
        """calculate all the heads of the common ancestors of nodes a and b"""
        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.commonancestorsheads(a, b)
        except (AttributeError, OverflowError): # C implementation failed
            ancs = ancestor.commonancestorsheads(self.parentrevs, a, b)
        return map(self.node, ancs)

    def isancestor(self, a, b):
        """return True if node a is an ancestor of node b

        The implementation of this is trivial but the use of
        commonancestorsheads is not."""
        return a in self.commonancestorsheads(a, b)

    def ancestor(self, a, b):
        """calculate the "best" common ancestor of nodes a and b"""

        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.ancestors(a, b)
        except (AttributeError, OverflowError):
            ancs = ancestor.ancestors(self.parentrevs, a, b)
        if ancs:
            # choose a consistent winner when there's a tie
            return min(map(self.node, ancs))
        return nullid

    def _match(self, id):
        if isinstance(id, int):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if str(rev) != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (TypeError, LookupError):
                pass

    def _partialmatch(self, id):
        try:
            n = self.index.partialmatch(id)
            if n and self.hasnode(n):
                return n
            return None
        except RevlogError:
            # parsers.c radix tree lookup gave multiple matches
            # fall through to slow path that filters hidden revisions
            pass
        except (AttributeError, ValueError):
            # we are pure python, or key was too short to search radix tree
            pass

        if id in self._pcache:
            return self._pcache[id]

        if len(id) < 40:
            try:
                # hex(node)[:...]
                l = len(id) // 2 # grab an even number of digits
                prefix = bin(id[:l * 2])
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [n for n in nl if hex(n).startswith(id) and
                      self.hasnode(n)]
                if len(nl) > 0:
                    if len(nl) == 1:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise LookupError(id, self.indexfile,
                                      _('ambiguous identifier'))
                return None
            except TypeError:
                pass

    def lookup(self, id):
        """locate a node based on:
        - revision number or str(revision number)
        - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(id, self.indexfile, _('no match found'))

    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different than what is stored.
        """
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def _addchunk(self, offset, data):
        o, d = self._chunkcache
        # try to add to existing cache
        if o + len(d) == offset and len(d) + len(data) < _chunksize:
            self._chunkcache = o, d + data
        else:
            self._chunkcache = offset, data

    def _loadchunk(self, offset, length):
        if self._inline:
            df = self.opener(self.indexfile)
        else:
            df = self.opener(self.datafile)

        # Cache data both forward and backward around the requested
        # data, in a fixed size window. This helps speed up operations
        # involving reading the revlog backwards.
        cachesize = self._chunkcachesize
        realoffset = offset & ~(cachesize - 1)
        reallength = (((offset + length + cachesize) & ~(cachesize - 1))
                      - realoffset)
        df.seek(realoffset)
        d = df.read(reallength)
        df.close()
        self._addchunk(realoffset, d)
        if offset != realoffset or reallength != length:
            return util.buffer(d, offset - realoffset, length)
        return d
952
952
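The window arithmetic in _loadchunk rounds the requested range down and up to multiples of the cache size, so data on both sides of the request ends up cached. A standalone sketch of just that arithmetic, assuming a power-of-two cachesize (the real value comes from self._chunkcachesize); not part of revlog.py:

# Sketch of the read-window arithmetic used by _loadchunk.
def readwindow(offset, length, cachesize=65536):
    realoffset = offset & ~(cachesize - 1)        # round start down
    realend = (offset + length + cachesize) & ~(cachesize - 1)  # round end up
    return realoffset, realend - realoffset

# A 100-byte read at offset 70000 maps to the aligned 64KiB window
# [65536, 131072), so the request's neighbors get cached too.
assert readwindow(70000, 100) == (65536, 65536)
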
    def _getchunk(self, offset, length):
        o, d = self._chunkcache
        l = len(d)

        # is it in the cache?
        cachestart = offset - o
        cacheend = cachestart + length
        if cachestart >= 0 and cacheend <= l:
            if cachestart == 0 and cacheend == l:
                return d # avoid a copy
            return util.buffer(d, cachestart, cacheend - cachestart)

        return self._loadchunk(offset, length)

    def _chunkraw(self, startrev, endrev):
        start = self.start(startrev)
        end = self.end(endrev)
        if self._inline:
            start += (startrev + 1) * self._io.size
            end += (endrev + 1) * self._io.size
        length = end - start
        return self._getchunk(start, length)

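The (startrev + 1) * self._io.size adjustment above accounts for inline revlogs, where each revision's data is preceded by its fixed-size index entry in the same .i file. A sketch of the offset computation; the 64-byte entry size is a hypothetical stand-in for self._io.size, and this is not part of revlog.py:

# In an inline revlog, rev r's data starts (r + 1) index entries past
# its logical data offset, because entries and data interleave.
def inline_data_offset(logical_start, rev, iosize=64):
    return logical_start + (rev + 1) * iosize

# rev 0's data begins right after index entry 0, even though its
# logical data offset is 0:
assert inline_data_offset(0, 0) == 64
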
    def _chunk(self, rev):
        return decompress(self._chunkraw(rev, rev))

    def _chunks(self, revs):
        '''faster version of [self._chunk(rev) for rev in revs]

        Assumes that revs is in ascending order.'''
        if not revs:
            return []
        start = self.start
        length = self.length
        inline = self._inline
        iosize = self._io.size
        buffer = util.buffer

        l = []
        ladd = l.append

        # preload the cache
        try:
            while True:
                # ensure that the cache doesn't change out from under us
                _cache = self._chunkcache
                self._chunkraw(revs[0], revs[-1])
                if _cache == self._chunkcache:
                    break
            offset, data = _cache
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows
            return [self._chunk(rev) for rev in revs]

        for rev in revs:
            chunkstart = start(rev)
            if inline:
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            ladd(decompress(buffer(data, chunkstart - offset, chunklength)))

        return l

    def _chunkclear(self):
        self._chunkcache = (0, '')

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self._generaldelta:
            return base
        else:
            return rev - 1

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return str(self._chunk(rev2))

        return mdiff.textdiff(self.revision(rev1),
                              self.revision(rev2))

    def revision(self, nodeorrev):
        """return an uncompressed revision of a given node or revision
        number.
        """
        if isinstance(nodeorrev, int):
            rev = nodeorrev
            node = self.node(rev)
        else:
            node = nodeorrev
            rev = None

        _cache = self._cache # grab local copy of cache to avoid thread race
        cachedrev = None
        if node == nullid:
            return ""
        if _cache:
            if _cache[0] == node:
                return _cache[2]
            cachedrev = _cache[1]

        # look up what we need to read
        text = None
        if rev is None:
            rev = self.rev(node)

        # check rev flags
        if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
            raise RevlogError(_('incompatible revision flag %x') %
                              (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

        # build delta chain
        chain = []
        index = self.index # for performance
        generaldelta = self._generaldelta
        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != cachedrev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]

        if iterrev == cachedrev:
            # cache hit
            text = _cache[2]
        else:
            chain.append(iterrev)
        chain.reverse()

        # drop cache to save memory
        self._cache = None

        bins = self._chunks(chain)
        if text is None:
            text = str(bins[0])
            bins = bins[1:]

        text = mdiff.patches(text, bins)

        text = self._checkhash(text, node, rev)

        self._cache = (node, rev, text)
        return text

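Reconstruction in revision() is therefore: take the chain's base fulltext, then fold every delta in chain order through mdiff.patches(). A simplified sketch of that fold, not part of revlog.py; deltas here are reduced to (start, end, replacement) triples rather than real binary bdiff patches:

# Minimal model of delta-chain application.
def apply_chain(fulltext, deltas):
    text = fulltext
    for start, end, repl in deltas:    # chain order: base towards target
        text = text[:start] + repl + text[end:]
    return text

base = 'abcdef'
chain = [(0, 1, 'A'), (5, 6, 'F')]     # two stacked single-byte edits
assert apply_chain(base, chain) == 'AbcdeF'
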
    def hash(self, text, p1, p2):
        """Compute a node hash.

        Available as a function so that subclasses can replace the hash
        as needed.
        """
        return hash(text, p1, p2)

    def _checkhash(self, text, node, rev):
        p1, p2 = self.parents(node)
        self.checkhash(text, p1, p2, node, rev)
        return text

    def checkhash(self, text, p1, p2, node, rev=None):
        if node != self.hash(text, p1, p2):
            revornode = rev
            if revornode is None:
                revornode = templatefilters.short(hex(node))
            raise RevlogError(_("integrity check failed on %s:%s")
                              % (self.indexfile, revornode))

    def checkinlinesize(self, tr, fp=None):
        if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
            return

        trinfo = tr.find(self.indexfile)
        if trinfo is None:
            raise RevlogError(_("%s not found in the transaction")
                              % self.indexfile)

        trindex = trinfo[2]
        if trindex is not None:
            dataoff = self.start(trindex)
        else:
            # revlog was stripped at start of transaction, use all leftover
            # data
            trindex = len(self) - 1
            dataoff = self.end(-2)

        tr.add(self.datafile, dataoff)

        if fp:
            fp.flush()
            fp.close()

        df = self.opener(self.datafile, 'w')
        try:
            for r in self:
                df.write(self._chunkraw(r, r))
        finally:
            df.close()

        fp = self.opener(self.indexfile, 'w', atomictemp=True)
        self.version &= ~(REVLOGNGINLINEDATA)
        self._inline = False
        for i in self:
            e = self._io.packentry(self.index[i], self.node, self.version, i)
            fp.write(e)

        # if we don't call close, the temp file will never replace the
        # real index
        fp.close()

        tr.replace(self.indexfile, trindex * self._io.size)
        self._chunkclear()

    def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
                    node=None):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        node - nodeid of revision; typically node is not specified, and it is
            computed by default as hash(text, p1, p2), however subclasses might
            use a different hashing method (and override checkhash() in that
            case)
        """
        if link == nullrev:
            raise RevlogError(_("attempted to add linkrev -1 to %s")
                              % self.indexfile)

        if len(text) > _maxentrysize:
            raise RevlogError(
                _("%s: size of %d bytes exceeds maximum revlog storage of 2GiB")
                % (self.indexfile, len(text)))

        node = node or self.hash(text, p1, p2)
        if node in self.nodemap:
            return node

        dfh = None
        if not self._inline:
            dfh = self.opener(self.datafile, "a")
        ifh = self.opener(self.indexfile, "a+")
        try:
            return self._addrevision(node, text, transaction, link, p1, p2,
                                     REVIDX_DEFAULT_FLAGS, cachedelta, ifh, dfh)
        finally:
            if dfh:
                dfh.close()
            ifh.close()

    def compress(self, text):
        """ generate a possibly-compressed representation of text """
        if not text:
            return ("", text)
        l = len(text)
        bin = None
        if l < 44:
            pass
        elif l > 1000000:
            # zlib makes an internal copy, thus doubling memory usage for
            # large files, so let's do this in pieces
            z = zlib.compressobj()
            p = []
            pos = 0
            while pos < l:
                pos2 = pos + 2**20
                p.append(z.compress(text[pos:pos2]))
                pos = pos2
            p.append(z.flush())
            if sum(map(len, p)) < l:
                bin = "".join(p)
        else:
            bin = _compress(text)
        if bin is None or len(bin) > l:
            if text[0] == '\0':
                return ("", text)
            return ('u', text)
        return ("", bin)

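The tuple compress() returns is a tiny envelope: an empty header means zlib data (or literal text that already starts with '\0'), while 'u' marks text stored uncompressed because compression did not pay off. A sketch of a matching decoder in the file's Python 2 idiom, not part of revlog.py; the real decompress() dispatches on the first stored byte instead of a separate header value:

import zlib

def decode(header, data):
    if header == 'u':
        return data                    # kept verbatim: zlib did not help
    if not data or data[0] == '\0':
        return data                    # empty, or literal '\0'-led text
    return zlib.decompress(data)

h, d = '', zlib.compress('x' * 1000)
assert decode(h, d) == 'x' * 1000
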
    def _isgooddelta(self, d, textlen):
        """Returns True if the given delta is good. Good means that it is
        within the disk span, disk size, and chain length bounds that we know
        to be performant."""
        if d is None:
            return False

        # - 'dist' is the distance from the base revision -- bounding it limits
        #   the amount of I/O we need to do.
        # - 'compresseddeltalen' is the sum of the total size of deltas we need
        #   to apply -- bounding it limits the amount of CPU we consume.
        dist, l, data, base, chainbase, chainlen, compresseddeltalen = d
        if (dist > textlen * 4 or l > textlen or
            compresseddeltalen > textlen * 2 or
            (self._maxchainlen and chainlen > self._maxchainlen)):
            return False

        return True

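Concretely, for a 1000-byte fulltext the check rejects any candidate whose chain spans more than 4000 bytes on disk, whose delta exceeds 1000 bytes, or whose accumulated deltas exceed 2000 bytes. The same predicate as a standalone sketch with hypothetical tuple values, not part of revlog.py:

# Standalone restatement of the _isgooddelta bounds; d mirrors the
# builddelta() result tuple.
def isgooddelta(d, textlen, maxchainlen=None):
    if d is None:
        return False
    dist, l, data, base, chainbase, chainlen, compresseddeltalen = d
    if (dist > textlen * 4 or l > textlen or
        compresseddeltalen > textlen * 2 or
        (maxchainlen and chainlen > maxchainlen)):
        return False
    return True

# 1000-byte fulltext: a 4001-byte disk span is already too expensive.
good = (3000, 200, None, 5, 2, 3, 900)
bad = (4001, 200, None, 5, 2, 3, 900)
assert isgooddelta(good, 1000) and not isgooddelta(bad, 1000)
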
    def _addrevision(self, node, text, transaction, link, p1, p2, flags,
                     cachedelta, ifh, dfh):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.
        invariants:
        - text is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        btext = [text]
        def buildtext():
            if btext[0] is not None:
                return btext[0]
            # flush any pending writes here so we can read it in revision
            if dfh:
                dfh.flush()
            ifh.flush()
            baserev = cachedelta[0]
            delta = cachedelta[1]
            # special case deltas which replace entire base; no need to decode
            # base revision. this neatly avoids censored bases, which throw
            # when they're decoded.
            hlen = struct.calcsize(">lll")
            if delta[:hlen] == mdiff.replacediffheader(self.rawsize(baserev),
                                                       len(delta) - hlen):
                btext[0] = delta[hlen:]
            else:
                basetext = self.revision(self.node(baserev))
                btext[0] = mdiff.patch(basetext, delta)
            try:
                self.checkhash(btext[0], p1, p2, node)
                if flags & REVIDX_ISCENSORED:
                    raise RevlogError(_('node %s is not censored') % node)
            except CensoredNodeError:
                # must pass the censored index flag to add censored revisions
                if not flags & REVIDX_ISCENSORED:
                    raise
            return btext[0]

        def builddelta(rev):
            # can we use the cached delta?
            if cachedelta and cachedelta[0] == rev:
                delta = cachedelta[1]
            else:
                t = buildtext()
                if self.iscensored(rev):
                    # deltas based on a censored revision must replace the
                    # full content in one patch, so delta works everywhere
                    header = mdiff.replacediffheader(self.rawsize(rev), len(t))
                    delta = header + t
                else:
                    ptext = self.revision(self.node(rev))
                    delta = mdiff.textdiff(ptext, t)
            data = self.compress(delta)
            l = len(data[1]) + len(data[0])
            if basecache[0] == rev:
                chainbase = basecache[1]
            else:
                chainbase = self.chainbase(rev)
            dist = l + offset - self.start(chainbase)
            if self._generaldelta:
                base = rev
            else:
                base = chainbase
            chainlen, compresseddeltalen = self._chaininfo(rev)
            chainlen += 1
            compresseddeltalen += l
            return dist, l, data, base, chainbase, chainlen, compresseddeltalen

        curr = len(self)
        prev = curr - 1
        base = chainbase = curr
        chainlen = None
        offset = self.end(prev)
        d = None
        if self._basecache is None:
            self._basecache = (prev, self.chainbase(prev))
        basecache = self._basecache
        p1r, p2r = self.rev(p1), self.rev(p2)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if text is None:
            textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                        cachedelta[1])
        else:
            textlen = len(text)

        # should we try to build a delta?
        if prev != nullrev:
            if self._generaldelta:
                # Pick whichever parent is closer to us (to minimize the
                # chance of having to build a fulltext). Since
                # nullrev == -1, any non-merge commit will always pick p1r.
                drev = p2r if p2r > p1r else p1r
                d = builddelta(drev)
                # If the chosen delta will result in us making a full text,
                # give it one last try against prev.
                if drev != prev and not self._isgooddelta(d, textlen):
                    d = builddelta(prev)
            else:
                d = builddelta(prev)
            dist, l, data, base, chainbase, chainlen, compresseddeltalen = d

        if not self._isgooddelta(d, textlen):
            text = buildtext()
            data = self.compress(text)
            l = len(data[1]) + len(data[0])
            base = chainbase = curr

        e = (offset_type(offset, flags), l, textlen,
             base, link, p1r, p2r, node)
        self.index.insert(-1, e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version, curr)
        self._writeentry(transaction, ifh, dfh, entry, data, link, offset)

        if type(text) == str: # only accept immutable objects
            self._cache = (node, curr, text)
        self._basecache = (curr, chainbase)
        return node

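The generaldelta branch above is the heart of this changeset: delta against the closer (higher-numbered) parent, and only fall back to prev when that delta would fail _isgooddelta and force a fulltext. The choice reduces to a small pure function; a sketch with the goodness test and delta builder abstracted into hypothetical callbacks, not part of revlog.py:

nullrev = -1

def choosedelta(p1r, p2r, prev, builddelta, isgood):
    drev = p2r if p2r > p1r else p1r   # closer parent; p1r for non-merges
    d = builddelta(drev)
    if drev != prev and not isgood(d):
        d = builddelta(prev)           # one last try before a fulltext
    return d

# A non-merge (p2r == nullrev) with an acceptable parent delta simply
# deltas against p1:
assert choosedelta(7, nullrev, 9, lambda rev: rev, lambda d: True) == 7
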
    def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
        curr = len(self) - 1
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            dfh.flush()
            ifh.write(entry)
        else:
            offset += curr * self._io.size
            transaction.add(self.indexfile, offset, curr)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self.checkinlinesize(transaction, ifh)

    def addgroup(self, bundle, linkmapper, transaction, addrevisioncb=None):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.

        If ``addrevisioncb`` is defined, it will be called with arguments of
        this revlog and the node that was added.
        """

        # track the base of the current delta log
        content = []
        node = None

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self.opener(self.indexfile, "a+")
        isize = r * self._io.size
        if self._inline:
            transaction.add(self.indexfile, end + isize, r)
            dfh = None
        else:
            transaction.add(self.indexfile, isize, r)
            transaction.add(self.datafile, end)
            dfh = self.opener(self.datafile, "a")
        def flush():
            if dfh:
                dfh.flush()
            ifh.flush()
        try:
            # loop through our set of deltas
            chain = None
            while True:
                chunkdata = bundle.deltachunk(chain)
                if not chunkdata:
                    break
                node = chunkdata['node']
                p1 = chunkdata['p1']
                p2 = chunkdata['p2']
                cs = chunkdata['cs']
                deltabase = chunkdata['deltabase']
                delta = chunkdata['delta']

                content.append(node)

                link = linkmapper(cs)
                if node in self.nodemap:
                    # this can happen if two branches make the same change
                    chain = node
                    continue

                for p in (p1, p2):
                    if p not in self.nodemap:
                        raise LookupError(p, self.indexfile,
                                          _('unknown parent'))

                if deltabase not in self.nodemap:
                    raise LookupError(deltabase, self.indexfile,
                                      _('unknown delta base'))

                baserev = self.rev(deltabase)

                if baserev != nullrev and self.iscensored(baserev):
                    # if base is censored, delta must be full replacement in a
                    # single patch operation
                    hlen = struct.calcsize(">lll")
                    oldlen = self.rawsize(baserev)
                    newlen = len(delta) - hlen
                    if delta[:hlen] != mdiff.replacediffheader(oldlen, newlen):
                        raise error.CensoredBaseError(self.indexfile,
                                                      self.node(baserev))

                flags = REVIDX_DEFAULT_FLAGS
                if self._peek_iscensored(baserev, delta, flush):
                    flags |= REVIDX_ISCENSORED

                chain = self._addrevision(node, None, transaction, link,
                                          p1, p2, flags, (baserev, delta),
                                          ifh, dfh)

                if addrevisioncb:
                    # Data for added revision can't be read unless flushed
                    # because _loadchunk always opens a new file handle and
                    # there is no guarantee data was actually written yet.
                    flush()
                    addrevisioncb(self, chain)

                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self.opener(self.datafile, "a")
                    ifh = self.opener(self.indexfile, "a")
        finally:
            if dfh:
                dfh.close()
            ifh.close()

        return content

    def iscensored(self, rev):
        """Check if a file revision is censored."""
        return False

    def _peek_iscensored(self, baserev, delta, flush):
        """Quickly check if a delta produces a censored revision."""
        return False

    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        brokenrevs = set()
        strippoint = len(self)

        heads = {}
        futurelargelinkrevs = set()
        for head in self.headrevs():
            headlinkrev = self.linkrev(head)
            heads[head] = headlinkrev
            if headlinkrev >= minlink:
                futurelargelinkrevs.add(headlinkrev)

        # This algorithm involves walking down the rev graph, starting at the
        # heads. Since the revs are topologically sorted according to linkrev,
        # once all head linkrevs are below the minlink, we know there are
        # no more revs that could have a linkrev greater than minlink.
        # So we can stop walking.
        while futurelargelinkrevs:
            strippoint -= 1
            linkrev = heads.pop(strippoint)

            if linkrev < minlink:
                brokenrevs.add(strippoint)
            else:
                futurelargelinkrevs.remove(linkrev)

            for p in self.parentrevs(strippoint):
                if p != nullrev:
                    plinkrev = self.linkrev(p)
                    heads[p] = plinkrev
                    if plinkrev >= minlink:
                        futurelargelinkrevs.add(plinkrev)

        return strippoint, brokenrevs

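The walk can be tried on a toy history where parentrevs and linkrev are plain lists. A sketch simplified to one parent per revision, not part of revlog.py; the two-head example shows how a rev with a small linkrev above the strip point lands in brokenrevs:

# Toy version of the getstrippoint walk. parents, linkrevs and
# headrevs stand in for parentrevs()/linkrev()/headrevs().
def strippoint(parents, linkrevs, headrevs, minlink):
    brokenrevs = set()
    point = len(linkrevs)
    heads = dict((h, linkrevs[h]) for h in headrevs)
    future = set(l for l in heads.values() if l >= minlink)
    while future:
        point -= 1
        linkrev = heads.pop(point)
        if linkrev < minlink:
            brokenrevs.add(point)      # stripped, but its linkrev survives
        else:
            future.remove(linkrev)
        p = parents[point]
        if p != -1:
            heads[p] = linkrevs[p]
            if linkrevs[p] >= minlink:
                future.add(linkrevs[p])
    return point, brokenrevs

# Two heads (revs 1 and 3). Stripping linkrev >= 2 truncates at rev 1,
# and rev 2 (linkrev 1) is collateral damage with a broken linkrev.
assert strippoint([-1, 0, 0, 2], [0, 3, 1, 2], [1, 3], 2) == (1, set([2]))
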
    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chaininfocache = {}
        self._chunkclear()
        for x in xrange(rev, len(self)):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]

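The truncation offsets computed above differ by layout: a split revlog cuts the data file at the stripped revision's data start and the index at rev times the entry size, while an inline revlog adds the two contributions in the single .i file. A sketch with a hypothetical 64-byte entry size, not part of revlog.py:

def truncation_points(datastart, rev, iosize=64, inline=False):
    if not inline:
        return {'datafile': datastart, 'indexfile': rev * iosize}
    return {'indexfile': datastart + rev * iosize}

assert truncation_points(4096, 10) == {'datafile': 4096, 'indexfile': 640}
assert truncation_points(4096, 10, inline=True) == {'indexfile': 4736}
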
    def checksize(self):
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            f = self.opener(self.datafile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            dd = actual - expected
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            s = self._io.size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError as inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res