revlog: move references to revlog.hash to inside the revlog class...
Augie Fackler
r22785:abc44fcc default
@@ -1,1457 +1,1465 @@
# revlog.py - storage back-end for mercurial
#
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""

# import stuff from node for others to import from revlog
from node import bin, hex, nullid, nullrev
from i18n import _
import ancestor, mdiff, parsers, error, util, templatefilters
import struct, zlib, errno

_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog header flags
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOGGENERALDELTA = (1 << 17)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGGENERALDELTA

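# A worked example of how these constants compose (illustrative sketch, not
# part of the original module): the version field stores the format number in
# the low 16 bits and feature flags in the high bits, so
#
#   >>> hex(REVLOG_DEFAULT_VERSION)
#   '0x10001'                            # REVLOGNG (1) | REVLOGNGINLINEDATA (1 << 16)
#   >>> REVLOG_DEFAULT_VERSION & 0xFFFF  # format number
#   1
#   >>> REVLOG_DEFAULT_VERSION & ~0xFFFF # feature flags
#   65536
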
# revlog index flags
REVIDX_KNOWN_FLAGS = 0

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

RevlogError = error.RevlogError
LookupError = error.LookupError

def getoffset(q):
    return int(q >> 16)

def gettype(q):
    return int(q & 0xFFFF)

def offset_type(offset, type):
    return long(long(offset) << 16 | type)

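# Round-trip sketch (illustrative, not part of the original module): an index
# entry's first field packs the data-file offset and the per-revision type
# flags into one integer, which getoffset/gettype take back apart:
#
#   >>> q = offset_type(1024, 0)
#   >>> getoffset(q), gettype(q)
#   (1024, 0)
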
_nullhash = _sha(nullid)

def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    # As of now, if one of the parent nodes is null, p2 is null
    if p2 == nullid:
        # deep copy of a hash is faster than creating one
        s = _nullhash.copy()
        s.update(p1)
    else:
        # none of the parent nodes are nullid
        l = [p1, p2]
        l.sort()
        s = _sha(l[0])
        s.update(l[1])
    s.update(text)
    return s.digest()

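# Usage sketch (illustrative only): the node hash is SHA-1 over the two
# parent nodes (sorted) followed by the text, so a root revision hashes as
# sha1(nullid + nullid + text):
#
#   >>> n = hash('some file contents\n', nullid, nullid)
#   >>> len(n)
#   20
#   >>> n == _sha(nullid + nullid + 'some file contents\n').digest()
#   True
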
def decompress(bin):
    """ decompress the given input """
    if not bin:
        return bin
    t = bin[0]
    if t == '\0':
        return bin
    if t == 'x':
        try:
            return _decompress(bin)
        except zlib.error, e:
            raise RevlogError(_("revlog decompress error: %s") % str(e))
    if t == 'u':
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)

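# The first byte of a stored chunk is a type tag (a sketch of the dispatch
# above, for illustration): '\0' means the chunk is used literally, 'x' is
# the usual first byte of a zlib stream, and 'u' marks data kept
# uncompressed because compression did not pay off:
#
#   >>> decompress('u' + 'plain text')
#   'plain text'
#   >>> decompress(_compress('plain text')) == 'plain text'
#   True
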
# index v0:
#  4 bytes: offset
#  4 bytes: compressed length
#  4 bytes: base rev
#  4 bytes: link rev
# 20 bytes: parent 1 nodeid
# 20 bytes: parent 2 nodeid
# 20 bytes: nodeid
indexformatv0 = ">4l20s20s20s"
v0shaoffset = 56

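# Packing sketch (illustrative values, not from the original module): a v0
# entry is four 32-bit ints followed by three raw 20-byte nodes, 76 bytes in
# all, with the entry's own node starting at byte 56 (v0shaoffset):
#
#   >>> struct.calcsize(indexformatv0)
#   76
#   >>> e = _pack(indexformatv0, 0, 11, 0, 0, nullid, nullid, '\x01' * 20)
#   >>> e[v0shaoffset:] == '\x01' * 20
#   True
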
class revlogoldio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, data, inline):
        s = self.size
        index = []
        nodemap = {nullid: nullrev}
        n = off = 0
        l = len(data)
        while off + s <= l:
            cur = data[off:off + s]
            off += s
            e = _unpack(indexformatv0, cur)
            # transform to revlogv1 format
            e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                  nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
            index.append(e2)
            nodemap[e[6]] = n
            n += 1

        # add the magic null revision at -1
        index.append((0, 0, 0, -1, -1, -1, -1, nullid))

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        if gettype(entry[0]):
            raise RevlogError(_("index entry flags need RevlogNG"))
        e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
              node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *e2)

# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
ngshaoffset = 32
versionformat = ">I"

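# Size sketch (illustrative): an NG entry is a 64-bit offset+flags word, six
# 32-bit ints, a 20-byte node and 12 bytes of padding, 64 bytes in all. Note
# that packentry below splices the version word over the first 4 bytes of
# entry 0, which works because the offset of revision 0 is always 0 and so
# needs no storage:
#
#   >>> struct.calcsize(indexformatng)
#   64
#   >>> struct.calcsize(versionformat)
#   4
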
class revlogio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, data, inline):
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, getattr(index, 'nodemap', None), cache

    def packentry(self, entry, node, version, rev):
        p = _pack(indexformatng, *entry)
        if rev == 0:
            p = _pack(versionformat, version) + p[4:]
        return p

class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.
    """
    def __init__(self, opener, indexfile):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener
        self._cache = None
        self._basecache = None
        self._chunkcache = (0, '')
        self._chunkcachesize = 65536
        self.index = []
        self._pcache = {}
        self._nodecache = {nullid: nullrev}
        self._nodepos = None

        v = REVLOG_DEFAULT_VERSION
        opts = getattr(opener, 'options', None)
        if opts is not None:
            if 'revlogv1' in opts:
                if 'generaldelta' in opts:
                    v |= REVLOGGENERALDELTA
            else:
                v = 0
            if 'chunkcachesize' in opts:
                self._chunkcachesize = opts['chunkcachesize']

        if self._chunkcachesize <= 0:
            raise RevlogError(_('revlog chunk cache size %r is not greater '
                                'than 0') % self._chunkcachesize)
        elif self._chunkcachesize & (self._chunkcachesize - 1):
            raise RevlogError(_('revlog chunk cache size %r is not a power '
                                'of 2') % self._chunkcachesize)

        i = ''
        self._initempty = True
        try:
            f = self.opener(self.indexfile)
            i = f.read()
            f.close()
            if len(i) > 0:
                v = struct.unpack(versionformat, i[:4])[0]
                self._initempty = False
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise

        self.version = v
        self._inline = v & REVLOGNGINLINEDATA
        self._generaldelta = v & REVLOGGENERALDELTA
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        if fmt == REVLOGV0 and flags:
            raise RevlogError(_("index %s unknown flags %#04x for format v0")
                              % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
            raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                              % (self.indexfile, flags >> 16))
        elif fmt > REVLOGNG:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))

        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        try:
            d = self._io.parseindex(i, self._inline)
        except (ValueError, IndexError):
            raise RevlogError(_("index %s is corrupted") % (self.indexfile))
        self.index, nodemap, self._chunkcache = d
        if nodemap is not None:
            self.nodemap = self._nodecache = nodemap
        if not self._chunkcache:
            self._chunkclear()

    def tip(self):
        return self.node(len(self.index) - 2)
    def __len__(self):
        return len(self.index) - 1
    def __iter__(self):
        return iter(xrange(len(self)))
    def revs(self, start=0, stop=None):
        """iterate over all revs in this revlog (from start to stop)"""
        step = 1
        if stop is not None:
            if start > stop:
                step = -1
            stop += step
        else:
            stop = len(self)
        return xrange(start, stop, step)

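    # Behavior sketch (illustrative): stop is inclusive, and walking
    # backwards works by flipping the step, so on a revlog with at least six
    # revisions:
    #
    #   >>> list(rl.revs(start=2, stop=5))    # rl: some revlog instance
    #   [2, 3, 4, 5]
    #   >>> list(rl.revs(start=5, stop=2))
    #   [5, 4, 3, 2]
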
    @util.propertycache
    def nodemap(self):
        self.rev(self.node(0))
        return self._nodecache

    def hasnode(self, node):
        try:
            self.rev(node)
            return True
        except KeyError:
            return False

    def clearcaches(self):
        try:
            self._nodecache.clearcaches()
        except AttributeError:
            self._nodecache = {nullid: nullrev}
            self._nodepos = None

    def rev(self, node):
        try:
            return self._nodecache[node]
        except TypeError:
            raise
        except RevlogError:
            # parsers.c radix tree lookup failed
            raise LookupError(node, self.indexfile, _('no node'))
        except KeyError:
            # pure python cache lookup failed
            n = self._nodecache
            i = self.index
            p = self._nodepos
            if p is None:
                p = len(i) - 2
            for r in xrange(p, -1, -1):
                v = i[r][7]
                n[v] = r
                if v == node:
                    self._nodepos = r - 1
                    return r
            raise LookupError(node, self.indexfile, _('no node'))

    def node(self, rev):
        return self.index[rev][7]
    def linkrev(self, rev):
        return self.index[rev][4]
    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
    def parentrevs(self, rev):
        return self.index[rev][5:7]
    def start(self, rev):
        return int(self.index[rev][0] >> 16)
    def end(self, rev):
        return self.start(rev) + self.length(rev)
    def length(self, rev):
        return self.index[rev][1]
    def chainbase(self, rev):
        index = self.index
        base = index[rev][3]
        while base != rev:
            rev = base
            base = index[rev][3]
        return base
    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF
    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.revision(self.node(rev))
        return len(t)
    size = rawsize

    def ancestors(self, revs, stoprev=0, inclusive=False):
        """Generate the ancestors of 'revs' in reverse topological order.
        Does not generate revs lower than stoprev.

        See the documentation for ancestor.lazyancestors for more details."""

        return ancestor.lazyancestors(self, revs, stoprev=stoprev,
                                      inclusive=inclusive)

    def descendants(self, revs):
        """Generate the descendants of 'revs' in revision order.

        Yield a sequence of revision numbers starting with a child of
        some rev in revs, i.e., each revision is *not* considered a
        descendant of itself. Results are ordered by revision number (a
        topological sort)."""
        first = min(revs)
        if first == nullrev:
            for i in self:
                yield i
            return

        seen = set(revs)
        for i in self.revs(start=first + 1):
            for x in self.parentrevs(i):
                if x != nullrev and x in seen:
                    seen.add(i)
                    yield i
                    break

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common. In revset terminology, we return the
        tuple:

          ::common, (::heads) - (::common)

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        class lazyset(object):
            def __init__(self, lazyvalues):
                self.addedvalues = set()
                self.lazyvalues = lazyvalues

            def __contains__(self, value):
                return value in self.addedvalues or value in self.lazyvalues

            def __iter__(self):
                added = self.addedvalues
                for r in added:
                    yield r
                for r in self.lazyvalues:
                    if r not in added:
                        yield r

            def add(self, value):
                self.addedvalues.add(value)

            def update(self, values):
                self.addedvalues.update(values)

        has = lazyset(self.ancestors(common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = util.deque(r for r in heads if r not in has)
        while visit:
            r = visit.popleft()
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(r) for r in missing]

    def findmissingrevs(self, common=None, heads=None):
        """Return the revision numbers of the ancestors of heads that
        are not ancestors of common.

        More specifically, return a list of revision numbers corresponding to
        nodes N such that every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of revision numbers. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullrev."""
        if common is None:
            common = [nullrev]
        if heads is None:
            heads = self.headrevs()

        return ancestor.missingancestors(heads, common, self.parentrevs)

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        return [self.node(r) for r in
                ancestor.missingancestors(heads, common, self.parentrevs)]

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses the list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n) # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev: # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents are
                # descendants. (We seeded the descendants set with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n, flag in heads.iteritems() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def headrevs(self):
        try:
            return self.index.headrevs()
        except AttributeError:
            return self._headrevs()

    def _headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        # we won't iterate over filtered revs, so nobody is a head at start
        ishead = [0] * (count + 1)
        index = self.index
        for r in self:
            ishead[r] = 1 # I may be a head
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0 # my parents are not
        return [r for r, val in enumerate(ishead) if val]

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = set([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = set((startrev,))
        heads = set((startrev,))

        parentrevs = self.parentrevs
        for r in self.revs(start=startrev + 1):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable.add(r)
                        heads.add(r)
                    if p in heads and p not in stoprevs:
                        heads.remove(p)

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in self.revs(start=p + 1):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def descendant(self, start, end):
        if start == nullrev:
            return True
        for i in self.descendants([start]):
            if i == end:
                return True
            elif i > end:
                break
        return False

    def commonancestorsheads(self, a, b):
        """calculate all the heads of the common ancestors of nodes a and b"""
        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.commonancestorsheads(a, b)
        except (AttributeError, OverflowError): # C implementation failed
            ancs = ancestor.commonancestorsheads(self.parentrevs, a, b)
        return map(self.node, ancs)

    def isancestor(self, a, b):
        """return True if node a is an ancestor of node b

        The implementation of this is trivial but the use of
        commonancestorsheads is not."""
        return a in self.commonancestorsheads(a, b)

    def ancestor(self, a, b):
        """calculate the "best" common ancestor of nodes a and b"""

        a, b = self.rev(a), self.rev(b)
        try:
            ancs = self.index.ancestors(a, b)
        except (AttributeError, OverflowError):
            ancs = ancestor.ancestors(self.parentrevs, a, b)
        if ancs:
            # choose a consistent winner when there's a tie
            return min(map(self.node, ancs))
        return nullid

    def _match(self, id):
        if isinstance(id, int):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if str(rev) != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (TypeError, LookupError):
                pass

    def _partialmatch(self, id):
        try:
            n = self.index.partialmatch(id)
            if n and self.hasnode(n):
                return n
            return None
        except RevlogError:
            # parsers.c radix tree lookup gave multiple matches
            # fall through to slow path that filters hidden revisions
            pass
        except (AttributeError, ValueError):
            # we are pure python, or key was too short to search radix tree
            pass

        if id in self._pcache:
            return self._pcache[id]

        if len(id) < 40:
            try:
                # hex(node)[:...]
                l = len(id) // 2 # grab an even number of digits
                prefix = bin(id[:l * 2])
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [n for n in nl if hex(n).startswith(id) and
                      self.hasnode(n)]
                if len(nl) > 0:
                    if len(nl) == 1:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise LookupError(id, self.indexfile,
                                      _('ambiguous identifier'))
                return None
            except TypeError:
                pass

    def lookup(self, id):
        """locate a node based on:
            - revision number or str(revision number)
            - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(id, self.indexfile, _('no match found'))

    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different from what is stored.
        """
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def _addchunk(self, offset, data):
        o, d = self._chunkcache
        # try to add to existing cache
        if o + len(d) == offset and len(d) + len(data) < _chunksize:
            self._chunkcache = o, d + data
        else:
            self._chunkcache = offset, data

    def _loadchunk(self, offset, length):
        if self._inline:
            df = self.opener(self.indexfile)
        else:
            df = self.opener(self.datafile)

        # Cache data both forward and backward around the requested
        # data, in a fixed size window. This helps speed up operations
        # involving reading the revlog backwards.
        cachesize = self._chunkcachesize
        realoffset = offset & ~(cachesize - 1)
        reallength = (((offset + length + cachesize) & ~(cachesize - 1))
                      - realoffset)
        df.seek(realoffset)
        d = df.read(reallength)
        df.close()
        self._addchunk(realoffset, d)
        if offset != realoffset or reallength != length:
            return util.buffer(d, offset - realoffset, length)
        return d

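    # Worked example of the windowing arithmetic above (illustrative values):
    # with the default cachesize of 65536, a request for offset=70000,
    # length=1000 rounds the start down to the enclosing 64KiB boundary and
    # the end up past the next one:
    #
    #   realoffset = 70000 & ~65535                           -> 65536
    #   reallength = ((70000 + 1000 + 65536) & ~65535) - 65536 -> 65536
    #
    # so one 64KiB block covering bytes [65536, 131072) is read and cached,
    # and a buffer view of just the requested 1000 bytes is returned.
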
    def _getchunk(self, offset, length):
        o, d = self._chunkcache
        l = len(d)

        # is it in the cache?
        cachestart = offset - o
        cacheend = cachestart + length
        if cachestart >= 0 and cacheend <= l:
            if cachestart == 0 and cacheend == l:
                return d # avoid a copy
            return util.buffer(d, cachestart, cacheend - cachestart)

        return self._loadchunk(offset, length)

    def _chunkraw(self, startrev, endrev):
        start = self.start(startrev)
        end = self.end(endrev)
        if self._inline:
            start += (startrev + 1) * self._io.size
            end += (endrev + 1) * self._io.size
        length = end - start
        return self._getchunk(start, length)

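    # Why the inline adjustment above (illustrative note): in an inline
    # revlog the index entries and data chunks are interleaved in a single
    # file, as entry 0, data 0, entry 1, data 1, ... So the raw data for
    # revision r starts not at self.start(r) but (r + 1) * self._io.size
    # bytes further in, past its own index entry and those of every earlier
    # revision.
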
911 def _chunk(self, rev):
911 def _chunk(self, rev):
912 return decompress(self._chunkraw(rev, rev))
912 return decompress(self._chunkraw(rev, rev))
913
913
    def _chunks(self, revs):
        '''faster version of [self._chunk(rev) for rev in revs]

        Assumes that revs is in ascending order.'''
        if not revs:
            return []
        start = self.start
        length = self.length
        inline = self._inline
        iosize = self._io.size
        buffer = util.buffer

        l = []
        ladd = l.append

        # preload the cache
        try:
            while True:
                # ensure that the cache doesn't change out from under us
                _cache = self._chunkcache
                self._chunkraw(revs[0], revs[-1])
                if _cache == self._chunkcache:
                    break
            offset, data = _cache
        except OverflowError:
            # issue4215 - we can't cache a run of chunks greater than
            # 2G on Windows
            return [self._chunk(rev) for rev in revs]

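        # at this point the cache holds one contiguous buffer covering
        # revs[0] through revs[-1]; each chunk below is sliced out of
        # that buffer without copying before being decompressed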
        for rev in revs:
            chunkstart = start(rev)
            if inline:
                chunkstart += (rev + 1) * iosize
            chunklength = length(rev)
            ladd(decompress(buffer(data, chunkstart - offset, chunklength)))

        return l

    def _chunkclear(self):
        self._chunkcache = (0, '')

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self._generaldelta:
            return base
        else:
            return rev - 1

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return str(self._chunk(rev2))

        return mdiff.textdiff(self.revision(rev1),
                              self.revision(rev2))

    def revision(self, nodeorrev):
        """return an uncompressed revision of a given node or revision
        number.
        """
        if isinstance(nodeorrev, int):
            rev = nodeorrev
            node = self.node(rev)
        else:
            node = nodeorrev
            rev = None

        _cache = self._cache # grab local copy of cache to avoid thread race
        cachedrev = None
        if node == nullid:
            return ""
        if _cache:
            if _cache[0] == node:
                return _cache[2]
            cachedrev = _cache[1]

        # look up what we need to read
        text = None
        if rev is None:
            rev = self.rev(node)

        # check rev flags
        if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
            raise RevlogError(_('incompatible revision flag %x') %
                              (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

        # build delta chain
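        # (walk from rev back toward its base, collecting every rev
        # whose delta must be applied on top of the base text; slot 3 of
        # an index entry holds that rev's delta base)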
        chain = []
        index = self.index # for performance
        generaldelta = self._generaldelta
        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != cachedrev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]

        if iterrev == cachedrev:
            # cache hit
            text = _cache[2]
        else:
            chain.append(iterrev)
        chain.reverse()

        # drop cache to save memory
        self._cache = None

        bins = self._chunks(chain)
        if text is None:
            text = str(bins[0])
            bins = bins[1:]

        text = mdiff.patches(text, bins)

        text = self._checkhash(text, node, rev)

        self._cache = (node, rev, text)
        return text

    def hash(self, text, p1, p2):
        """Compute a node hash.

        Available as a function so that subclasses can replace the hash
        as needed.
        """
        return hash(text, p1, p2)

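    # A subclass that stores nodes under a different hashing scheme can
    # override hash(); checkhash() and addrevision() call it through
    # self. A hypothetical sketch, not part of this file:
    #
    #   class customrevlog(revlog):
    #       def hash(self, text, p1, p2):
    #           # illustrative only: any stable digest of text + parents
    #           return _sha(p1 + p2 + text).digest()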
    def _checkhash(self, text, node, rev):
        p1, p2 = self.parents(node)
        self.checkhash(text, p1, p2, node, rev)
        return text

    def checkhash(self, text, p1, p2, node, rev=None):
        if node != self.hash(text, p1, p2):
            revornode = rev
            if revornode is None:
                revornode = templatefilters.short(hex(node))
            raise RevlogError(_("integrity check failed on %s:%s")
                              % (self.indexfile, revornode))

    def checkinlinesize(self, tr, fp=None):
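        # migrate an inline revlog (data embedded in the .i file) to a
        # separate .d data file once the inline data outgrows _maxinline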
        if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
            return

        trinfo = tr.find(self.indexfile)
        if trinfo is None:
            raise RevlogError(_("%s not found in the transaction")
                              % self.indexfile)

        trindex = trinfo[2]
        dataoff = self.start(trindex)

        tr.add(self.datafile, dataoff)

        if fp:
            fp.flush()
            fp.close()

        df = self.opener(self.datafile, 'w')
        try:
            for r in self:
                df.write(self._chunkraw(r, r))
        finally:
            df.close()

        fp = self.opener(self.indexfile, 'w', atomictemp=True)
        self.version &= ~(REVLOGNGINLINEDATA)
        self._inline = False
        for i in self:
            e = self._io.packentry(self.index[i], self.node, self.version, i)
            fp.write(e)

        # if we don't call close, the temp file will never replace the
        # real index
        fp.close()

        tr.replace(self.indexfile, trindex * self._io.size)
        self._chunkclear()

    def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
                    node=None):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        node - nodeid of revision; typically node is not specified, and it is
            computed by default as hash(text, p1, p2), however subclasses
            might use a different hashing method (and override checkhash()
            in such a case)
        """
        if link == nullrev:
            raise RevlogError(_("attempted to add linkrev -1 to %s")
                              % self.indexfile)
        node = node or self.hash(text, p1, p2)
        if node in self.nodemap:
            return node

        dfh = None
        if not self._inline:
            dfh = self.opener(self.datafile, "a")
        ifh = self.opener(self.indexfile, "a+")
        try:
            return self._addrevision(node, text, transaction, link, p1, p2,
                                     cachedelta, ifh, dfh)
        finally:
            if dfh:
                dfh.close()
            ifh.close()

    def compress(self, text):
        """ generate a possibly-compressed representation of text """
        if not text:
            return ("", text)
        l = len(text)
        bin = None
        if l < 44:
            pass
        elif l > 1000000:
            # zlib makes an internal copy, thus doubling memory usage for
            # large files, so let's do this in pieces
            z = zlib.compressobj()
            p = []
            pos = 0
            while pos < l:
                pos2 = pos + 2**20
                p.append(z.compress(text[pos:pos2]))
                pos = pos2
            p.append(z.flush())
            if sum(map(len, p)) < l:
                bin = "".join(p)
        else:
            bin = _compress(text)
        if bin is None or len(bin) > l:
            if text[0] == '\0':
                return ("", text)
            return ('u', text)
        return ("", bin)

    def _addrevision(self, node, text, transaction, link, p1, p2,
                     cachedelta, ifh, dfh):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.
        invariants:
        - text is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        btext = [text]
        def buildtext():
            if btext[0] is not None:
                return btext[0]
            # flush any pending writes here so we can read it in revision
            if dfh:
                dfh.flush()
            ifh.flush()
            basetext = self.revision(self.node(cachedelta[0]))
            btext[0] = mdiff.patch(basetext, cachedelta[1])
            self.checkhash(btext[0], p1, p2, node)
            return btext[0]

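        # (btext is a single-element list so buildtext() can rebind the
        # text from its enclosing scope; this Python 2 code predates the
        # 'nonlocal' keyword)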
        def builddelta(rev):
            # can we use the cached delta?
            if cachedelta and cachedelta[0] == rev:
                delta = cachedelta[1]
            else:
                t = buildtext()
                ptext = self.revision(self.node(rev))
                delta = mdiff.textdiff(ptext, t)
            data = self.compress(delta)
            l = len(data[1]) + len(data[0])
            if basecache[0] == rev:
                chainbase = basecache[1]
            else:
                chainbase = self.chainbase(rev)
            dist = l + offset - self.start(chainbase)
            if self._generaldelta:
                base = rev
            else:
                base = chainbase
            return dist, l, data, base, chainbase

        curr = len(self)
        prev = curr - 1
        base = chainbase = curr
        offset = self.end(prev)
        flags = 0
        d = None
        if self._basecache is None:
            self._basecache = (prev, self.chainbase(prev))
        basecache = self._basecache
        p1r, p2r = self.rev(p1), self.rev(p2)

        # should we try to build a delta?
        if prev != nullrev:
            if self._generaldelta:
                if p1r >= basecache[1]:
                    d = builddelta(p1r)
                elif p2r >= basecache[1]:
                    d = builddelta(p2r)
                else:
                    d = builddelta(prev)
            else:
                d = builddelta(prev)
            dist, l, data, base, chainbase = d

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
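        # (concretely: when the on-disk span of the delta chain, dist,
        # exceeds twice the uncompressed length, a full snapshot is
        # stored instead, so reads never replay an overly long chain)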
        if text is None:
            textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                        cachedelta[1])
        else:
            textlen = len(text)
        if d is None or dist > textlen * 2:
            text = buildtext()
            data = self.compress(text)
            l = len(data[1]) + len(data[0])
            base = chainbase = curr

        e = (offset_type(offset, flags), l, textlen,
             base, link, p1r, p2r, node)
        self.index.insert(-1, e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version, curr)
        self._writeentry(transaction, ifh, dfh, entry, data, link, offset)

        if type(text) == str: # only accept immutable objects
            self._cache = (node, curr, text)
        self._basecache = (curr, chainbase)
        return node

    def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
        curr = len(self) - 1
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            dfh.flush()
            ifh.write(entry)
        else:
            offset += curr * self._io.size
            transaction.add(self.indexfile, offset, curr)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self.checkinlinesize(transaction, ifh)

    def addgroup(self, bundle, linkmapper, transaction):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.
        """

        # track the base of the current delta log
        content = []
        node = None

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self.opener(self.indexfile, "a+")
        isize = r * self._io.size
        if self._inline:
            transaction.add(self.indexfile, end + isize, r)
            dfh = None
        else:
            transaction.add(self.indexfile, isize, r)
            transaction.add(self.datafile, end)
            dfh = self.opener(self.datafile, "a")

        try:
            # loop through our set of deltas
            chain = None
            while True:
                chunkdata = bundle.deltachunk(chain)
                if not chunkdata:
                    break
                node = chunkdata['node']
                p1 = chunkdata['p1']
                p2 = chunkdata['p2']
                cs = chunkdata['cs']
                deltabase = chunkdata['deltabase']
                delta = chunkdata['delta']

                content.append(node)

                link = linkmapper(cs)
                if node in self.nodemap:
                    # this can happen if two branches make the same change
                    chain = node
                    continue

                for p in (p1, p2):
                    if p not in self.nodemap:
                        raise LookupError(p, self.indexfile,
                                          _('unknown parent'))

                if deltabase not in self.nodemap:
                    raise LookupError(deltabase, self.indexfile,
                                      _('unknown delta base'))

                baserev = self.rev(deltabase)
                chain = self._addrevision(node, None, transaction, link,
                                          p1, p2, (baserev, delta), ifh, dfh)
                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self.opener(self.datafile, "a")
                    ifh = self.opener(self.indexfile, "a")
        finally:
            if dfh:
                dfh.close()
            ifh.close()

        return content

    def getstrippoint(self, minlink):
        """find the minimum rev that must be stripped to strip the linkrev

        Returns a tuple containing the minimum rev and a set of all revs that
        have linkrevs that will be broken by this strip.
        """
        brokenrevs = set()
        strippoint = len(self)

        heads = {}
        futurelargelinkrevs = set()
        for head in self.headrevs():
            headlinkrev = self.linkrev(head)
            heads[head] = headlinkrev
            if headlinkrev >= minlink:
                futurelargelinkrevs.add(headlinkrev)

        # This algorithm involves walking down the rev graph, starting at the
        # heads. Since the revs are topologically sorted according to linkrev,
        # once all head linkrevs are below the minlink, we know there are
        # no more revs that could have a linkrev greater than or equal to
        # minlink. So we can stop walking.
        while futurelargelinkrevs:
            strippoint -= 1
            linkrev = heads.pop(strippoint)

            if linkrev < minlink:
                brokenrevs.add(strippoint)
            else:
                futurelargelinkrevs.remove(linkrev)

            for p in self.parentrevs(strippoint):
                if p != nullrev:
                    plinkrev = self.linkrev(p)
                    heads[p] = plinkrev
                    if plinkrev >= minlink:
                        futurelargelinkrevs.add(plinkrev)

        return strippoint, brokenrevs

    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        rev, _ = self.getstrippoint(minlink)
        if rev == len(self):
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chunkclear()
        for x in xrange(rev, len(self)):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]

    def checksize(self):
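        # returns (dd, di): the number of unexpected trailing bytes in
        # the data file and the index file respectively; both are 0 when
        # the on-disk sizes match what the index entries predict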
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            f = self.opener(self.datafile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            dd = actual - expected
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            s = self._io.size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res