upstream/mercurial-mirror Commit - r21107:4a6c8b6b

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

"""Storage back-end for Mercurial.

8

"""Storage back-end for Mercurial.

9

10

This provides efficient delta storage with O(1) retrieve and append

10

This provides efficient delta storage with O(1) retrieve and append

11

and O(changes) merge between branches.

11

and O(changes) merge between branches.

12

"""

12

"""

13

14

# import stuff from node for others to import from revlog

14

# import stuff from node for others to import from revlog

15

from node import bin, hex, nullid, nullrev

15

from node import bin, hex, nullid, nullrev

16

from i18n import _

16

from i18n import _

17

import ancestor, mdiff, parsers, error, util, templatefilters

17

import ancestor, mdiff, parsers, error, util, templatefilters

18

import struct, zlib, errno

18

import struct, zlib, errno

19

20

# Short module-level aliases for library callables used in this file.
_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog header flags
# The version word stored at the start of an index keeps the format number
# in its low 16 bits and the feature flags in the bits above them.
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOGGENERALDELTA = (1 << 17)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGGENERALDELTA

# revlog index flags
REVIDX_KNOWN_FLAGS = 0

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

RevlogError = error.RevlogError
LookupError = error.LookupError

45

46

def getoffset(q):
    """return the offset part of a combined offset/type value

    q is an integer laid out as built by offset_type(): the offset lives
    above the low 16 bits.
    """
    return int(q >> 16)

48

49

def gettype(q):
    """return the type/flags part of a combined offset/type value

    q is an integer laid out as built by offset_type(): the type occupies
    the low 16 bits.
    """
    return int(q & 0xFFFF)

51

52

def offset_type(offset, type):
    """combine a data offset and a type/flags value into one integer

    The offset is shifted left by 16 bits and OR-ed with type, so the
    result can be split again with getoffset() and gettype().
    """
    # "<<" binds tighter than "|": this is (offset << 16) | type
    return long(long(offset) << 16 | type)

54

55

# hash object already fed with nullid; hash() copies it instead of
# re-hashing nullid for every revision that has a null second parent
nullhash = _sha(nullid)

def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.

    The digest is computed over the two parent ids in sorted order
    followed by text, and returned as a raw digest string.
    """
    # As of now, if one of the parent node is null, p2 is null
    if p2 == nullid:
        # deep copy of a hash is faster than creating one
        s = nullhash.copy()
        s.update(p1)
    else:
        # none of the parent nodes are nullid
        l = [p1, p2]
        l.sort()
        s = _sha(l[0])
        s.update(l[1])
    s.update(text)
    return s.digest()

77

78

def decompress(bin):
    """decompress the given input

    The first character of bin selects how the chunk is decoded:

    - NUL: the chunk is returned unchanged (marker included)
    - 'x': the whole chunk is handed to zlib and the inflated data returned
    - 'u': the chunk is stored as is; the marker is stripped

    An empty chunk is returned unchanged. RevlogError is raised when zlib
    rejects the data or the marker is not one of the above.
    """
    if not bin:
        return bin
    t = bin[0]
    if t == '\0':
        return bin
    if t == 'x':
        try:
            return _decompress(bin)
        except zlib.error:
            # fetch the exception through sys.exc_info() so this parses on
            # every Python version ("except X, e" is Python 2 only)
            import sys
            e = sys.exc_info()[1]
            raise RevlogError(_("revlog decompress error: %s") % str(e))
    if t == 'u':
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)

93

94

# index v0:
#  4 bytes: offset
#  4 bytes: compressed length
#  4 bytes: base rev
#  4 bytes: link rev
# 20 bytes: parent 1 nodeid
# 20 bytes: parent 2 nodeid
# 20 bytes: nodeid
indexformatv0 = ">4l20s20s20s"
# byte position of the nodeid within a v0 record (4 * 4 + 2 * 20)
v0shaoffset = 56

104

105

class revlogoldio(object):
    """parser and packer for index records in the v0 layout"""

    def __init__(self):
        # size in bytes of one v0 index record
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, data, inline):
        """parse raw v0 index data

        Returns (index, nodemap, None). index is a list of 8-tuples in the
        revlogng layout, terminated by an entry for the null revision, and
        nodemap maps each nodeid to its revision number. A trailing partial
        record is ignored. inline is not used here.
        """
        recsize = self.size
        index = []
        nodemap = {nullid: nullrev}
        # one iteration per complete record; the range is empty when data
        # holds less than one record
        for rev, pos in enumerate(xrange(0, len(data) - recsize + 1,
                                         recsize)):
            e = _unpack(indexformatv0, data[pos:pos + recsize])
            # transform to revlogv1 format: v0 has no uncompressed length
            # (stored as -1) and records parents as nodeids, not revs
            e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                  nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev),
                  e[6])
            index.append(e2)
            nodemap[e[6]] = rev

        # add the magic null revision at -1
        index.append((0, 0, 0, -1, -1, -1, -1, nullid))

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        """pack a revlogng-style index entry into a v0 record

        node is a callable turning a revision number into a nodeid; it is
        applied to the two parent revs. version and rev are not used.
        Raises RevlogError when the entry carries flags, which v0 cannot
        store.
        """
        if gettype(entry[0]):
            raise RevlogError(_("index entry flags need RevlogNG"))
        e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
              node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *e2)

137

138

# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid (20 bytes of hash followed by 12 bytes of padding)
indexformatng = ">Qiiiiii20s12x"
# byte position of the nodeid within an ng record (8 + 6 * 4)
ngshaoffset = 32
# layout of the version word found at the very start of an index
versionformat = ">I"

151

152

class revlogio(object):
    """parser and packer for index records in the revlogng layout"""

    def __init__(self):
        # size in bytes of one ng index record
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, data, inline):
        """parse raw ng index data

        Returns (index, nodemap, cache): index and cache come from
        parsers.parse_index2(); nodemap is the index's 'nodemap' attribute
        when it has one, None otherwise.
        """
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, getattr(index, 'nodemap', None), cache

    def packentry(self, entry, node, version, rev):
        """pack an index entry into an ng record

        For revision 0 the first four bytes of the record are replaced by
        the packed version word. node is not used.
        """
        p = _pack(indexformatng, *entry)
        if rev == 0:
            p = _pack(versionformat, version) + p[4:]
        return p

166

167

class revlog(object):

167

class revlog(object):

168

"""

168

"""

169

the underlying revision storage object

169

the underlying revision storage object

170

171

A revlog consists of two parts, an index and the revision data.

171

A revlog consists of two parts, an index and the revision data.

172

173

The index is a file with a fixed record size containing

173

The index is a file with a fixed record size containing

174

information on each revision, including its nodeid (hash), the

174

information on each revision, including its nodeid (hash), the

175

nodeids of its parents, the position and offset of its data within

175

nodeids of its parents, the position and offset of its data within

176

the data file, and the revision it's based on. Finally, each entry

176

the data file, and the revision it's based on. Finally, each entry

177

contains a linkrev entry that can serve as a pointer to external

177

contains a linkrev entry that can serve as a pointer to external

178

data.

178

data.

179

180

The revision data itself is a linear collection of data chunks.

180

The revision data itself is a linear collection of data chunks.

181

Each chunk represents a revision and is usually represented as a

181

Each chunk represents a revision and is usually represented as a

182

delta against the previous chunk. To bound lookup time, runs of

182

delta against the previous chunk. To bound lookup time, runs of

183

deltas are limited to about 2 times the length of the original

183

deltas are limited to about 2 times the length of the original

184

version data. This makes retrieval of a version proportional to

184

version data. This makes retrieval of a version proportional to

185

its size, or O(1) relative to the number of revisions.

185

its size, or O(1) relative to the number of revisions.

186

187

Both pieces of the revlog are written to in an append-only

187

Both pieces of the revlog are written to in an append-only

188

fashion, which means we never need to rewrite a file to insert or

188

fashion, which means we never need to rewrite a file to insert or

189

remove data, and can use some simple techniques to avoid the need

189

remove data, and can use some simple techniques to avoid the need

190

for locking while reading.

190

for locking while reading.

191

"""

191

"""

192

def __init__(self, opener, indexfile):
    """
    create a revlog object

    opener is a function that abstracts the file opening operation
    and can be used to implement COW semantics or the like.

    indexfile names the index; the data file name is derived from it by
    replacing its last two characters with ".d". The index is read and
    parsed here. RevlogError is raised for an invalid chunk cache size,
    an unknown format or flags, or an index that cannot be parsed.
    """
    self.indexfile = indexfile
    self.datafile = indexfile[:-2] + ".d"
    self.opener = opener
    self._cache = None
    self._basecache = None
    self._chunkcache = (0, '')
    self._chunkcachesize = 65536
    self.index = []
    self._pcache = {}
    self._nodecache = {nullid: nullrev}
    self._nodepos = None

    # version used when the index does not exist yet or is empty; an
    # existing index overrides it below
    v = REVLOG_DEFAULT_VERSION
    opts = getattr(opener, 'options', None)
    if opts is not None:
        if 'revlogv1' in opts:
            if 'generaldelta' in opts:
                v |= REVLOGGENERALDELTA
        else:
            v = 0
        if 'chunkcachesize' in opts:
            self._chunkcachesize = opts['chunkcachesize']

    if self._chunkcachesize <= 0:
        raise RevlogError(_('revlog chunk cache size %r is not greater '
                            'than 0') % self._chunkcachesize)
    elif self._chunkcachesize & (self._chunkcachesize - 1):
        # a power of two has exactly one bit set, so n & (n - 1) is 0
        raise RevlogError(_('revlog chunk cache size %r is not a power '
                            'of 2') % self._chunkcachesize)

    i = ''
    self._initempty = True
    try:
        f = self.opener(self.indexfile)
        try:
            i = f.read()
        finally:
            # close the handle even when read() fails
            f.close()
        if len(i) > 0:
            try:
                v = struct.unpack(versionformat, i[:4])[0]
            except struct.error:
                # fewer than 4 bytes on disk: not even a version word
                raise RevlogError(_("index %s is corrupted")
                                  % (self.indexfile))
            self._initempty = False
    except IOError:
        # fetch the exception through sys.exc_info() so this parses on
        # every Python version ("except X, e" is Python 2 only)
        import sys
        inst = sys.exc_info()[1]
        # a missing index simply means an empty revlog
        if inst.errno != errno.ENOENT:
            raise

    self.version = v
    self._inline = v & REVLOGNGINLINEDATA
    self._generaldelta = v & REVLOGGENERALDELTA
    flags = v & ~0xFFFF
    fmt = v & 0xFFFF
    if fmt == REVLOGV0 and flags:
        raise RevlogError(_("index %s unknown flags %#04x for format v0")
                          % (self.indexfile, flags >> 16))
    elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
        raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                          % (self.indexfile, flags >> 16))
    elif fmt > REVLOGNG:
        raise RevlogError(_("index %s unknown format %d")
                          % (self.indexfile, fmt))

    self._io = revlogio()
    if self.version == REVLOGV0:
        self._io = revlogoldio()
    try:
        d = self._io.parseindex(i, self._inline)
    except (ValueError, IndexError):
        raise RevlogError(_("index %s is corrupted") % (self.indexfile))
    self.index, nodemap, self._chunkcache = d
    if nodemap is not None:
        self.nodemap = self._nodecache = nodemap
    if not self._chunkcache:
        self._chunkclear()

269

270

def tip(self):
    """return the nodeid of the last revision in the index"""
    # the final index entry is skipped: len(self.index) - 1 is what
    # __len__ reports, so the last revision sits at len(self.index) - 2
    return self.node(len(self.index) - 2)

272

def __len__(self):
    """return the number of revisions, i.e. the index length minus one"""
    return len(self.index) - 1

274

def __iter__(self):
    """iterate over the revision numbers 0 .. len(self) - 1"""
    return iter(xrange(len(self)))

276

def revs(self, start=0, stop=None):
    """iterate over all rev in this revlog (from start to stop)

    stop is inclusive. When start is greater than stop the revisions are
    produced in decreasing order. Without stop, iteration runs from start
    up to the last revision.
    """
    step = 1
    if stop is not None:
        if start > stop:
            step = -1
        # xrange excludes its end point; move it one step further so that
        # stop itself is produced
        stop += step
    else:
        stop = len(self)
    return xrange(start, stop, step)

286

287

@util.propertycache
def nodemap(self):
    """return the nodeid -> revision number mapping"""
    # looking up the node of revision 0 makes rev() walk the index all the
    # way down to revision 0, recording every node it passes in
    # self._nodecache
    self.rev(self.node(0))
    return self._nodecache

291

292

def hasnode(self, node):
    """return True if node can be resolved by rev(), False otherwise"""
    try:
        self.rev(node)
        return True
    except KeyError:
        # NOTE(review): relies on the LookupError raised by rev() being
        # caught as a KeyError -- confirm against the error module
        return False

298

299

def clearcaches(self):
    """drop the cached nodeid -> revision lookups"""
    try:
        # a node cache object with its own clearcaches() resets itself
        self._nodecache.clearcaches()
    except AttributeError:
        # plain dict cache: start over with only the null revision and
        # make rev() rescan the index from the top
        self._nodecache = {nullid: nullrev}
        self._nodepos = None

305

306

def rev(self, node):
    """return the revision number of node

    Raises LookupError when node is not in this revlog.
    """
    try:
        return self._nodecache[node]
    except RevlogError:
        # parsers.c radix tree lookup failed
        raise LookupError(node, self.indexfile, _('no node'))
    except KeyError:
        # pure python cache lookup failed
        n = self._nodecache
        i = self.index
        # resume scanning where the previous scan stopped; everything
        # above that position is already in the cache
        p = self._nodepos
        if p is None:
            p = len(i) - 2
        for r in xrange(p, -1, -1):
            v = i[r][7]
            n[v] = r
            if v == node:
                self._nodepos = r - 1
                return r
        raise LookupError(node, self.indexfile, _('no node'))

326

327

def node(self, rev):
    """return the nodeid (index field 7) of revision rev"""
    return self.index[rev][7]

329

def linkrev(self, rev):
    """return the link rev (index field 4) of revision rev"""
    return self.index[rev][4]

331

def parents(self, node):
    """return the nodeids of both parents of node as a pair"""
    i = self.index
    d = i[self.rev(node)]
    # fields 5 and 6 hold the parent revs; index each one straight back
    # into the index to read its nodeid
    return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline

335

def parentrevs(self, rev):
    """return the two parent revs (index fields 5 and 6) of revision rev"""
    return self.index[rev][5:7]

337

def start(self, rev):
    """return the data offset of revision rev

    The offset is stored above the low 16 bits of index field 0.
    """
    return int(self.index[rev][0] >> 16)

339

def end(self, rev):
    """return the offset just past the stored data of revision rev"""
    return self.start(rev) + self.length(rev)

341

def length(self, rev):
    """return the compressed length (index field 1) of revision rev"""
    return self.index[rev][1]

343

def chainbase(self, rev):
    """return the revision at the bottom of the base chain of rev

    Follows index field 3 (base rev) from revision to revision until it
    reaches one that names itself as its base.
    """
    index = self.index
    base = index[rev][3]
    while base != rev:
        rev = base
        base = index[rev][3]
    return base

350

def flags(self, rev):
    """return the flags of revision rev (low 16 bits of index field 0)"""
    return self.index[rev][0] & 0xFFFF

352

def rawsize(self, rev):
    """return the length of the uncompressed text for a given revision"""
    l = self.index[rev][2]
    if l >= 0:
        return l

    # a negative stored length means it was not recorded (v0 indexes are
    # parsed with -1 here); rebuild the text and measure it
    t = self.revision(self.node(rev))
    return len(t)
size = rawsize

361

362

def ancestors(self, revs, stoprev=0, inclusive=False):
    """Generate the ancestors of 'revs' in reverse topological order.
    Does not generate revs lower than stoprev.

    All arguments are passed through to ancestor.lazyancestors, whose
    result is returned unchanged.

    See the documentation for ancestor.lazyancestors for more details."""

    return ancestor.lazyancestors(self, revs, stoprev=stoprev,
                                  inclusive=inclusive)

370

371

def descendants(self, revs):
    """Generate the descendants of 'revs' in revision order.

    Yield a sequence of revision numbers starting with a child of
    some rev in revs, i.e., each revision is *not* considered a
    descendant of itself.  Results are ordered by revision number (a
    topological sort).

    revs may be any iterable of revision numbers, including a one-shot
    iterator. An empty revs yields nothing."""
    # build the set first: revs is then walked exactly once, so an
    # iterator is not used up before it is needed, and the empty case can
    # be answered without calling min() on nothing
    seen = set(revs)
    if not seen:
        return
    first = min(seen)
    if first == nullrev:
        # every revision descends from the null revision
        for i in self:
            yield i
        return

    for i in self.revs(start=first + 1):
        for x in self.parentrevs(i):
            if x != nullrev and x in seen:
                # i has a parent that is a root or a descendant of one;
                # remember it so that its own children qualify too
                seen.add(i)
                yield i
                break

391

392

def findcommonmissing(self, common=None, heads=None):
    """Return a tuple of the ancestors of common and the ancestors of heads
    that are not ancestors of common. In revset terminology, we return the
    tuple:

      ::common, (::heads) - (::common)

    The first element is a lazily evaluated set-like object holding
    revision numbers; the second is a list of node IDs.

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullid."""
    if common is None:
        common = [nullid]
    if heads is None:
        heads = self.heads()

    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    # we want the ancestors, but inclusive
    class lazyset(object):
        """set-like view over a lazy collection plus explicit additions"""

        def __init__(self, lazyvalues):
            self.addedvalues = set()
            self.lazyvalues = lazyvalues

        def __contains__(self, value):
            return value in self.addedvalues or value in self.lazyvalues

        def __iter__(self):
            added = self.addedvalues
            for r in added:
                yield r
            for r in self.lazyvalues:
                # already produced by the loop above
                if r not in added:
                    yield r

        def add(self, value):
            self.addedvalues.add(value)

        def update(self, values):
            self.addedvalues.update(values)

    has = lazyset(self.ancestors(common))
    has.add(nullrev)
    has.update(common)

    # take all ancestors from heads that aren't in has
    missing = set()
    visit = util.deque(r for r in heads if r not in has)
    while visit:
        r = visit.popleft()
        if r in missing:
            continue
        missing.add(r)
        for p in self.parentrevs(r):
            if p not in has:
                visit.append(p)
    return has, [self.node(r) for r in sorted(missing)]

455

456

def findmissingrevs(self, common=None, heads=None):
    """Return the revision numbers of the ancestors of heads that
    are not ancestors of common.

    More specifically, return a list of revision numbers corresponding to
    nodes N such that every N satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of revision numbers.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullrev.

    The computation itself is done by ancestor.missingancestors."""
    if common is None:
        common = [nullrev]
    if heads is None:
        heads = self.headrevs()

    return ancestor.missingancestors(heads, common, self.parentrevs)

478

479

def findmissing(self, common=None, heads=None):
    """Return the ancestors of heads that are not ancestors of common.

    More specifically, return a list of nodes N such that every N
    satisfies the following constraints:

      1. N is an ancestor of some node in 'heads'
      2. N is not an ancestor of any node in 'common'

    The list is sorted by revision number, meaning it is
    topologically sorted.

    'heads' and 'common' are both lists of node IDs.  If heads is
    not supplied, uses all of the revlog's heads.  If common is not
    supplied, uses nullid."""
    if common is None:
        common = [nullid]
    if heads is None:
        heads = self.heads()

    # ancestor.missingancestors works on revision numbers: translate the
    # node IDs on the way in and the result on the way out
    common = [self.rev(n) for n in common]
    heads = [self.rev(n) for n in heads]

    return [self.node(r) for r in
            ancestor.missingancestors(heads, common, self.parentrevs)]

504

505

def nodesbetween(self, roots=None, heads=None):
    """Return a topological path from 'roots' to 'heads'.

    Return a tuple (nodes, outroots, outheads) where 'nodes' is a
    topologically sorted list of all nodes N that satisfy both of
    these constraints:

      1. N is a descendant of some node in 'roots'
      2. N is an ancestor of some node in 'heads'

    Every node is considered to be both a descendant and an ancestor
    of itself, so every reachable node in 'roots' and 'heads' will be
    included in 'nodes'.

    'outroots' is the list of reachable nodes in 'roots', i.e., the
    subset of 'roots' that is returned in 'nodes'.  Likewise,
    'outheads' is the subset of 'heads' that is also in 'nodes'.

    'roots' and 'heads' are both lists of node IDs.  If 'roots' is
    unspecified, uses nullid as the only root.  If 'heads' is
    unspecified, uses list of all of the revlog's heads.

    An explicitly empty 'roots' or 'heads', or a query that matches
    nothing, yields three empty lists."""
    # Shared "nothing found" result.
    nonodes = ([], [], [])
    if roots is not None:
        roots = list(roots)
        if not roots:
            return nonodes
        lowestrev = min([self.rev(n) for n in roots])
    else:
        roots = [nullid] # Everybody's a descendant of nullid
        lowestrev = nullrev
    if (lowestrev == nullrev) and (heads is None):
        # We want _all_ the nodes!
        return ([self.node(r) for r in self], [nullid], list(self.heads()))
    if heads is None:
        # All nodes are ancestors, so the latest ancestor is the last
        # node.
        highestrev = len(self) - 1
        # Set ancestors to None to signal that every node is an ancestor.
        ancestors = None
        # Set heads to an empty dictionary for later discovery of heads
        heads = {}
    else:
        heads = list(heads)
        if not heads:
            return nonodes
        ancestors = set()
        # Turn heads into a dictionary so we can remove 'fake' heads.
        # Also, later we will be using it to filter out the heads we can't
        # find from roots.
        heads = dict.fromkeys(heads, False)
        # Start at the top and keep marking parents until we're done.
        nodestotag = set(heads)
        # Remember where the top was so we can use it as a limit later.
        highestrev = max([self.rev(n) for n in nodestotag])
        while nodestotag:
            # grab a node to tag
            n = nodestotag.pop()
            # Never tag nullid
            if n == nullid:
                continue
            # A node's revision number represents its place in a
            # topologically sorted list of nodes.
            r = self.rev(n)
            if r >= lowestrev:
                if n not in ancestors:
                    # If we are possibly a descendant of one of the roots
                    # and we haven't already been marked as an ancestor
                    ancestors.add(n) # Mark as ancestor
                    # Add non-nullid parents to list of nodes to tag.
                    nodestotag.update([p for p in self.parents(n) if
                                       p != nullid])
                elif n in heads: # We've seen it before, is it a fake head?
                    # So it is, real heads should not be the ancestors of
                    # any other heads.
                    heads.pop(n)
        if not ancestors:
            return nonodes
        # Now that we have our set of ancestors, we want to remove any
        # roots that are not ancestors.

        # If one of the roots was nullid, everything is included anyway.
        if lowestrev > nullrev:
            # But, since we weren't, let's recompute the lowest rev to not
            # include roots that aren't ancestors.

            # Filter out roots that aren't ancestors of heads
            roots = [n for n in roots if n in ancestors]
            # Recompute the lowest revision
            if roots:
                lowestrev = min([self.rev(n) for n in roots])
            else:
                # No more roots?  Return empty list
                return nonodes
        else:
            # We are descending from nullid, and don't need to care about
            # any other roots.
            lowestrev = nullrev
            roots = [nullid]
    # Transform our roots list into a set.
    descendants = set(roots)
    # Also, keep the original roots so we can filter out roots that aren't
    # 'real' roots (i.e. are descended from other roots).
    roots = descendants.copy()
    # Our topologically sorted list of output nodes.
    orderedout = []
    # Don't start at nullid since we don't want nullid in our output list,
    # and if nullid shows up in descendants, empty parents will look like
    # they're descendants.
    for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
        n = self.node(r)
        isdescendant = False
        if lowestrev == nullrev:  # Everybody is a descendant of nullid
            isdescendant = True
        elif n in descendants:
            # n is already a descendant
            isdescendant = True
            # This check only needs to be done here because all the roots
            # will start being marked as descendants before the loop.
            if n in roots:
                # If n was a root, check if it's a 'real' root.
                p = tuple(self.parents(n))
                # If any of its parents are descendants, it's not a root.
                if (p[0] in descendants) or (p[1] in descendants):
                    roots.remove(n)
        else:
            p = tuple(self.parents(n))
            # A node is a descendant if either of its parents are
            # descendants.  (We seeded the descendants set with the roots
            # up there, remember?)
            if (p[0] in descendants) or (p[1] in descendants):
                descendants.add(n)
                isdescendant = True
        if isdescendant and ((ancestors is None) or (n in ancestors)):
            # Only include nodes that are both descendants and ancestors.
            orderedout.append(n)
            if (ancestors is not None) and (n in heads):
                # We're trying to figure out which heads are reachable
                # from roots.
                # Mark this head as having been reached
                heads[n] = True
            elif ancestors is None:
                # Otherwise, we're trying to discover the heads.
                # Assume this is a head because if it isn't, the next step
                # will eventually remove it.
                heads[n] = True
                # But, obviously its parents aren't.
                for p in self.parents(n):
                    heads.pop(p, None)
    # Keep only the heads that were actually reached (flag set to True).
    heads = [n for n, flag in heads.iteritems() if flag]
    roots = list(roots)
    # Every early-exit case returned nonodes above, so a result that
    # reaches this point is expected to be non-empty.
    assert orderedout
    assert roots
    assert heads
    return (orderedout, roots, heads)

659

660

def headrevs(self):
    """Return the head revisions of this revlog.

    The index object's own headrevs() is used when it has one; an
    AttributeError from that attempt falls back to self._headrevs()."""
    try:
        found = self.index.headrevs()
    except AttributeError:
        found = self._headrevs()
    return found

665

666

def _headrevs(self):

666

def _headrevs(self):

667

count = len(self)

667

count = len(self)

668

if not count:

668

if not count:

669

return [nullrev]

669

return [nullrev]

670

# we won't iter over filtered rev so nobody is a head at start

670

# we won't iter over filtered rev so nobody is a head at start

671

ishead = [0] * (count + 1)

671

ishead = [0] * (count + 1)

672

index = self.index

672

index = self.index

673

for r in self:

673

for r in self:

674

ishead[r] = 1 # I may be an head

674

ishead[r] = 1 # I may be an head

675

e = index[r]

675

e = index[r]

676

ishead[e[5]] = ishead[e[6]] = 0 # my parent are not

676

ishead[e[5]] = ishead[e[6]] = 0 # my parent are not

677

return [r for r, val in enumerate(ishead) if val]

677

return [r for r, val in enumerate(ishead) if val]

678

679

def heads(self, start=None, stop=None):
    """return the list of all nodes that have no children

    if start is specified, only heads that are descendants of
    start will be returned
    if stop is specified, it will consider all the revs from stop
    as if they had no children
    """
    unbounded = start is None and stop is None
    if unbounded:
        # fast path: no filtering requested
        if len(self) == 0:
            return [nullid]
        return [self.node(r) for r in self.headrevs()]

    if start is None:
        start = nullid
    if stop is None:
        stop = []
    blocked = set([self.rev(n) for n in stop])
    first = self.rev(start)
    # revisions known to descend from start (start included)
    seen = set([first])
    # current head candidates among them
    tips = set([first])

    parentsof = self.parentrevs
    for rev in self.revs(start=first + 1):
        for parent in parentsof(rev):
            if parent in seen:
                # a stop revision is a head but is not walked through
                if rev not in blocked:
                    seen.add(rev)
                tips.add(rev)
            # a parent stops being a head unless it is a stop revision
            if parent not in blocked:
                tips.discard(parent)

    return [self.node(r) for r in tips]

712

713

def children(self, node):
    """find the children of a given node

    Scans every revision after the one holding 'node' and collects the
    nodes that list it as a parent.  A revision with no non-null
    parents counts as a child only when 'node' maps to nullrev."""
    found = []
    target = self.rev(node)
    for rev in self.revs(start=target + 1):
        realparents = [pr for pr in self.parentrevs(rev) if pr != nullrev]
        if not realparents:
            if target == nullrev:
                found.append(self.node(rev))
            continue
        for pr in realparents:
            if pr == target:
                found.append(self.node(rev))
    return found

726

727

def descendant(self, start, end):
    """Return True if revision 'end' is reached from revision 'start'.

    A start of nullrev always yields True.  Otherwise the revisions
    produced by self.descendants([start]) are scanned, giving up as
    soon as one of them is greater than 'end'."""
    if start == nullrev:
        return True
    for rev in self.descendants([start]):
        if rev == end:
            return True
        if rev > end:
            # past the target, it cannot show up any more
            return False
    return False

736

737

def commonancestorsheads(self, a, b):
    """calculate all the heads of the common ancestors of nodes a and b

    'a' and 'b' are nodes; the result of mapping self.node over the
    revisions found is returned."""
    reva = self.rev(a)
    revb = self.rev(b)
    try:
        found = self.index.commonancestorsheads(reva, revb)
    except (AttributeError, OverflowError):
        # the index (C implementation) could not answer; use the
        # ancestor module instead
        found = ancestor.commonancestorsheads(self.parentrevs, reva, revb)
    return map(self.node, found)

745

746

def commonancestors(self, a, b):
    """calculate the least common ancestors of nodes a and b

    'a' and 'b' are nodes; the result of mapping self.node over the
    revisions found is returned."""
    a, b = self.rev(a), self.rev(b)
    try:
        ancs = self.index.ancestors(a, b)
    except (AttributeError, OverflowError): # C implementation failed
        # fall back to the ancestor module
        ancs = ancestor.ancestors(self.parentrevs, a, b)
    return map(self.node, ancs)

def ancestor(self, a, b):
    """calculate a least common ancestor of nodes a and b

    Returns nullid when commonancestors() finds nothing."""
    ancs = self.commonancestors(a, b)
    if ancs:
        # choose a consistent winner when there's a tie
        return min(ancs)
    return nullid

762

758

763

def _match(self, id):
    """Resolve 'id' to a node when it identifies a revision exactly.

    Tried in order: an integer revision number, a 20-character value
    looked up as a node, the string form of a revision number
    (negative values count from the end), and a 40-character value
    converted with bin().  Falls off the end (returning None) when
    none of them matches."""
    if isinstance(id, int):
        # rev
        return self.node(id)
    if len(id) == 20:
        # possibly a binary node
        # odds of a binary node being all hex in ASCII are 1 in 10**25
        try:
            node = id
            self.rev(node) # quick search the index
            return node
        except LookupError:
            pass # may be partial hex id
    try:
        # str(rev)
        rev = int(id)
        # reject spellings that do not round-trip through str()
        if str(rev) != id:
            raise ValueError
        if rev < 0:
            rev = len(self) + rev
        if rev < 0 or rev >= len(self):
            raise ValueError
        return self.node(rev)
    except (ValueError, OverflowError):
        pass
    if len(id) == 40:
        try:
            # a full hex nodeid?
            # ('bin' is the helper imported from the node module)
            node = bin(id)
            self.rev(node)
            return node
        except (TypeError, LookupError):
            pass

796

792

797

def _partialmatch(self, id):
    """Resolve 'id', a hex node prefix, to the single node it names.

    Returns the node, or None when nothing usable matches.  Raises
    LookupError when the slow path finds more than one match.  Unique
    slow-path results are remembered in self._pcache."""
    try:
        n = self.index.partialmatch(id)
        # only report nodes this revlog admits to having
        if n and self.hasnode(n):
            return n
        return None
    except RevlogError:
        # parsers.c radix tree lookup gave multiple matches
        # fall through to slow path that filters hidden revisions
        pass
    except (AttributeError, ValueError):
        # we are pure python, or key was too short to search radix tree
        pass

    if id in self._pcache:
        return self._pcache[id]

    if len(id) < 40:
        try:
            # hex(node)[:...]
            l = len(id) // 2  # grab an even number of digits
            prefix = bin(id[:l * 2])
            # first pass: compare field 7 of each index entry against
            # the binary prefix
            nl = [e[7] for e in self.index if e[7].startswith(prefix)]
            # second pass: match the full (possibly odd-length) hex
            # prefix and drop nodes hasnode() rejects
            nl = [n for n in nl if hex(n).startswith(id) and
                  self.hasnode(n)]
            if len(nl) > 0:
                if len(nl) == 1:
                    self._pcache[id] = nl[0]
                    return nl[0]
                raise LookupError(id, self.indexfile,
                                  _('ambiguous identifier'))
            return None
        except TypeError:
            # presumably bin() rejecting a non-hex id -- confirm
            pass

831

827

832

def lookup(self, id):
    """locate a node based on:
        - revision number or str(revision number)
        - nodeid or subset of hex nodeid

    Raises LookupError when neither an exact nor a partial match is
    found.
    """
    exact = self._match(id)
    if exact is not None:
        return exact
    partial = self._partialmatch(id)
    if not partial:
        raise LookupError(id, self.indexfile, _('no match found'))
    return partial

845

841

846

def cmp(self, node, text):
    """compare text with a given file revision

    The text is hashed together with the parents of 'node' and the
    result is compared with 'node' itself.

    returns True if text is different than what is stored.
    """
    parents = self.parents(node)
    p1, p2 = parents
    digest = hash(text, p1, p2)
    return digest != node

853

849

854

def _addchunk(self, offset, data):

850

def _addchunk(self, offset, data):

855

o, d = self._chunkcache

851

o, d = self._chunkcache

856

# try to add to existing cache

852

# try to add to existing cache

857

if o + len(d) == offset and len(d) + len(data) < _chunksize:

853

if o + len(d) == offset and len(d) + len(data) < _chunksize:

858

self._chunkcache = o, d + data

854

self._chunkcache = o, d + data

859

else:

855

else:

860

self._chunkcache = offset, data

856

self._chunkcache = offset, data

861

857

862

def _loadchunk(self, offset, length):

858

def _loadchunk(self, offset, length):

863

if self._inline:

859

if self._inline:

864

df = self.opener(self.indexfile)

860

df = self.opener(self.indexfile)

865

else:

861

else:

866

df = self.opener(self.datafile)

862

df = self.opener(self.datafile)

867

863

868

# Cache data both forward and backward around the requested

864

# Cache data both forward and backward around the requested

869

# data, in a fixed size window. This helps speed up operations

865

# data, in a fixed size window. This helps speed up operations

870

# involving reading the revlog backwards.

866

# involving reading the revlog backwards.

871

cachesize = self._chunkcachesize

867

cachesize = self._chunkcachesize

872

realoffset = offset & ~(cachesize - 1)

868

realoffset = offset & ~(cachesize - 1)

873

reallength = (((offset + length + cachesize) & ~(cachesize - 1))

869

reallength = (((offset + length + cachesize) & ~(cachesize - 1))

874

- realoffset)

870

- realoffset)

875

df.seek(realoffset)

871

df.seek(realoffset)

876

d = df.read(reallength)

872

d = df.read(reallength)

877

df.close()

873

df.close()

878

self._addchunk(realoffset, d)

874

self._addchunk(realoffset, d)

879

if offset != realoffset or reallength != length:

875

if offset != realoffset or reallength != length:

880

return util.buffer(d, offset - realoffset, length)

876

return util.buffer(d, offset - realoffset, length)

881

return d

877

return d

882

878

883

def _getchunk(self, offset, length):

879

def _getchunk(self, offset, length):

884

o, d = self._chunkcache

880

o, d = self._chunkcache

885

l = len(d)

881

l = len(d)

886

882

887

# is it in the cache?

883

# is it in the cache?

888

cachestart = offset - o

884

cachestart = offset - o

889

cacheend = cachestart + length

885

cacheend = cachestart + length

890

if cachestart >= 0 and cacheend <= l:

886

if cachestart >= 0 and cacheend <= l:

891

if cachestart == 0 and cacheend == l:

887

if cachestart == 0 and cacheend == l:

892

return d # avoid a copy

888

return d # avoid a copy

893

return util.buffer(d, cachestart, cacheend - cachestart)

889

return util.buffer(d, cachestart, cacheend - cachestart)

894

890

895

return self._loadchunk(offset, length)

891

return self._loadchunk(offset, length)

896

892

897

def _chunkraw(self, startrev, endrev):

893

def _chunkraw(self, startrev, endrev):

898

start = self.start(startrev)

894

start = self.start(startrev)

899

end = self.end(endrev)

895

end = self.end(endrev)

900

if self._inline:

896

if self._inline:

901

start += (startrev + 1) * self._io.size

897

start += (startrev + 1) * self._io.size

902

end += (endrev + 1) * self._io.size

898

end += (endrev + 1) * self._io.size

903

length = end - start

899

length = end - start

904

return self._getchunk(start, length)

900

return self._getchunk(start, length)

905

901

906

def _chunk(self, rev):
    """Return the decompressed chunk stored for revision 'rev'."""
    raw = self._chunkraw(rev, rev)
    return decompress(raw)

908

904

909

def _chunks(self, revs):
    '''faster version of [self._chunk(rev) for rev in revs]

    Assumes that revs is in ascending order.

    Returns a list with one decompressed chunk per revision.'''
    if not revs:
        return []
    # bind everything used in the loop to local names
    start = self.start
    length = self.length
    inline = self._inline
    iosize = self._io.size
    buffer = util.buffer

    l = []
    ladd = l.append

    # preload the cache
    try:
        # one read covering the whole span; the bytes are then picked
        # up from self._chunkcache rather than from the return value
        self._chunkraw(revs[0], revs[-1])
        offset, data = self._chunkcache
    except OverflowError:
        # issue4215 - we can't cache a run of chunks greater than
        # 2G on Windows
        return [self._chunk(rev) for rev in revs]

    for rev in revs:
        chunkstart = start(rev)
        if inline:
            # same inline adjustment as _chunkraw()
            chunkstart += (rev + 1) * iosize
        chunklength = length(rev)
        # slice each chunk out of the cached data and decompress it
        ladd(decompress(buffer(data, chunkstart - offset, chunklength)))

    return l

941

937

942

def _chunkclear(self):

938

def _chunkclear(self):

943

self._chunkcache = (0, '')

939

self._chunkcache = (0, '')

944

940

945

def deltaparent(self, rev):
    """return deltaparent of the given revision

    This is nullrev when the revision is its own base (field 3 of its
    index entry), that base when self._generaldelta is set, and the
    previous revision otherwise."""
    base = self.index[rev][3]
    if base == rev:
        return nullrev
    if self._generaldelta:
        return base
    return rev - 1

954

950

955

def revdiff(self, rev1, rev2):
    """return or calculate a delta between two revisions

    When rev2's delta parent is rev1 (and rev1 is not nullrev) the
    chunk stored for rev2 is returned as is; otherwise both revisions
    are rebuilt and diffed."""
    storeddelta = rev1 != nullrev and self.deltaparent(rev2) == rev1
    if storeddelta:
        return str(self._chunk(rev2))

    oldtext = self.revision(rev1)
    newtext = self.revision(rev2)
    return mdiff.textdiff(oldtext, newtext)

962

958

963

def revision(self, nodeorrev):
    """return an uncompressed revision of a given node or revision
    number.

    The text is rebuilt by patching a chain of stored chunks, starting
    from the cached text in self._cache when the chain reaches the
    cached revision.  The result is checked with self._checkhash() and
    becomes the new content of self._cache.  Raises RevlogError when
    the revision carries flags outside REVIDX_KNOWN_FLAGS.
    """
    if isinstance(nodeorrev, int):
        rev = nodeorrev
        node = self.node(rev)
    else:
        node = nodeorrev
        # resolved further down, only if the cache cannot answer
        rev = None

    cachedrev = None
    if node == nullid:
        return ""
    # self._cache, when set, is a (node, rev, text) tuple
    if self._cache:
        if self._cache[0] == node:
            return self._cache[2]
        cachedrev = self._cache[1]

    # look up what we need to read
    text = None
    if rev is None:
        rev = self.rev(node)

    # check rev flags
    if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
        raise RevlogError(_('incompatible revision flag %x') %
                          (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

    # build delta chain
    chain = []
    index = self.index # for performance
    generaldelta = self._generaldelta
    iterrev = rev
    e = index[iterrev]
    # walk back until a revision that is its own base (field 3) or the
    # cached revision is reached
    while iterrev != e[3] and iterrev != cachedrev:
        chain.append(iterrev)
        if generaldelta:
            iterrev = e[3]
        else:
            iterrev -= 1
        e = index[iterrev]

    if iterrev == cachedrev:
        # cache hit
        text = self._cache[2]
    else:
        # the chain's base chunk has to be read as well
        chain.append(iterrev)
    # the chain was collected newest first; read it oldest first
    chain.reverse()

    # drop cache to save memory
    self._cache = None

    bins = self._chunks(chain)
    if text is None:
        # no cached text: the first chunk is the starting text
        text = str(bins[0])
        bins = bins[1:]

    text = mdiff.patches(text, bins)

    text = self._checkhash(text, node, rev)

    self._cache = (node, rev, text)
    return text

1027

1023

1028

def _checkhash(self, text, node, rev):

1024

def _checkhash(self, text, node, rev):

1029

p1, p2 = self.parents(node)

1025

p1, p2 = self.parents(node)

1030

self.checkhash(text, p1, p2, node, rev)

1026

self.checkhash(text, p1, p2, node, rev)

1031

return text

1027

return text

1032

1028

1033

def checkhash(self, text, p1, p2, node, rev=None):
    """Raise RevlogError unless ``node`` equals hash(text, p1, p2).

    The error message identifies the revision by ``rev`` when one is
    given, otherwise by the shortened hex form of ``node``.
    """
    if node == hash(text, p1, p2):
        return

    if rev is None:
        revornode = templatefilters.short(hex(node))
    else:
        revornode = rev
    raise RevlogError(_("integrity check failed on %s:%s")
                      % (self.indexfile, revornode))

1040

1036

1041

def checkinlinesize(self, tr, fp=None):
    """Split an inline revlog into separate index and data files.

    Nothing happens unless the revlog is inline and
    ``self.start(-2) + self.length(-2)`` has reached ``_maxinline``.
    Otherwise every revision chunk is copied into the data file, the
    index is rewritten without the inline flag, and the transaction
    ``tr`` is updated for both files.

    fp - optional open index handle; it is flushed and closed before the
         files are rewritten.

    Raises RevlogError when the index file is not part of ``tr``.
    """
    if not self._inline:
        return
    if (self.start(-2) + self.length(-2)) < _maxinline:
        return

    trinfo = tr.find(self.indexfile)
    if trinfo is None:
        raise RevlogError(_("%s not found in the transaction")
                          % self.indexfile)

    trindex = trinfo[2]
    tr.add(self.datafile, self.start(trindex))

    if fp:
        fp.flush()
        fp.close()

    # copy the raw chunk of every revision into the new data file
    datafh = self.opener(self.datafile, 'w')
    try:
        for rev in self:
            datafh.write(self._chunkraw(rev, rev))
    finally:
        datafh.close()

    indexfh = self.opener(self.indexfile, 'w', atomictemp=True)
    # the flag must be cleared before packing: packentry receives
    # self.version for every entry
    self.version &= ~(REVLOGNGINLINEDATA)
    self._inline = False
    for rev in self:
        packed = self._io.packentry(self.index[rev], self.node,
                                    self.version, rev)
        indexfh.write(packed)

    # if we don't call close, the temp file will never replace the
    # real index
    indexfh.close()

    tr.replace(self.indexfile, trindex * self._io.size)
    self._chunkclear()

1079

1075

1080

def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
                node=None):
    """add a revision to the log

    text - the revision data to add
    transaction - the transaction object used for rollback
    link - the linkrev data to add
    p1, p2 - the parent nodeids of the revision
    cachedelta - an optional precomputed delta
    node - nodeid of revision; typically node is not specified, and it is
        computed by default as hash(text, p1, p2), however subclasses might
        use different hashing method (and override checkhash() in such case)

    Returns the nodeid of the revision. If that node is already in
    self.nodemap nothing is written and the node is returned as is.

    Raises RevlogError when link is nullrev.
    """
    if link == nullrev:
        raise RevlogError(_("attempted to add linkrev -1 to %s")
                          % self.indexfile)
    node = node or hash(text, p1, p2)
    if node in self.nodemap:
        return node

    dfh = None
    ifh = None
    try:
        # open both handles inside the try block so that the data file
        # handle is still closed when opening the index file fails
        if not self._inline:
            dfh = self.opener(self.datafile, "a")
        ifh = self.opener(self.indexfile, "a+")
        return self._addrevision(node, text, transaction, link, p1, p2,
                                 cachedelta, ifh, dfh)
    finally:
        if dfh:
            dfh.close()
        if ifh is not None:
            ifh.close()

1111

1107

1112

def compress(self, text):
    """Return a (header, data) pair holding a possibly-compressed text.

    The header is 'u' when the text is stored uncompressed and does not
    start with a NUL byte, and "" in every other case (empty text,
    uncompressed text starting with NUL, or zlib-compressed data).
    Texts shorter than 44 bytes are never compressed, and compressed
    output is only used when it is not larger than the input.
    """
    if not text:
        return ("", text)

    size = len(text)
    packed = None
    if size > 1000000:
        # zlib makes an internal copy, thus doubling memory usage for
        # large files, so lets do this in pieces
        compressor = zlib.compressobj()
        pieces = []
        start = 0
        while start < size:
            stop = start + 2**20
            pieces.append(compressor.compress(text[start:stop]))
            start = stop
        pieces.append(compressor.flush())
        total = 0
        for piece in pieces:
            total += len(piece)
        if total < size:
            packed = "".join(pieces)
    elif size >= 44:
        packed = _compress(text)

    if packed is not None and len(packed) <= size:
        return ("", packed)
    if text[0] == '\0':
        return ("", text)
    return ('u', text)

1140

1136

1141

def _addrevision(self, node, text, transaction, link, p1, p2,
                 cachedelta, ifh, dfh):
    """internal function to add revisions to the log

    see addrevision for argument descriptions; ifh and dfh are the open
    index and data file handles (dfh may be None).

    invariants:
    - text is optional (can be None); if not set, cachedelta must be set.
      if both are set, they must correspond to each other.

    Returns node.
    """
    # one-element list so the nested helper can store the rebuilt text
    fulltext = [text]

    def buildtext():
        # return the full text, rebuilding it from cachedelta on first use
        if fulltext[0] is None:
            # flush any pending writes here so we can read it in revision
            if dfh:
                dfh.flush()
            ifh.flush()
            basetext = self.revision(self.node(cachedelta[0]))
            fulltext[0] = mdiff.patch(basetext, cachedelta[1])
            self.checkhash(fulltext[0], p1, p2, node)
        return fulltext[0]

    def builddelta(rev):
        # compute the compressed delta against rev and its chain metrics
        # can we use the cached delta?
        if cachedelta and cachedelta[0] == rev:
            delta = cachedelta[1]
        else:
            newtext = buildtext()
            oldtext = self.revision(self.node(rev))
            delta = mdiff.textdiff(oldtext, newtext)
        data = self.compress(delta)
        size = len(data[1]) + len(data[0])
        if basecache[0] == rev:
            chainbase = basecache[1]
        else:
            chainbase = self.chainbase(rev)
        dist = size + offset - self.start(chainbase)
        if self._generaldelta:
            base = rev
        else:
            base = chainbase
        return dist, size, data, base, chainbase

    curr = len(self)
    prev = curr - 1
    # defaults describe a full snapshot: the revision is its own base
    base = chainbase = curr
    offset = self.end(prev)
    flags = 0
    d = None
    if self._basecache is None:
        self._basecache = (prev, self.chainbase(prev))
    basecache = self._basecache
    p1r, p2r = self.rev(p1), self.rev(p2)

    # should we try to build a delta?
    if prev != nullrev:
        deltaparent = prev
        if self._generaldelta:
            if p1r >= basecache[1]:
                deltaparent = p1r
            elif p2r >= basecache[1]:
                deltaparent = p2r
        d = builddelta(deltaparent)
        dist, l, data, base, chainbase = d

    # full versions are inserted when the needed deltas
    # become comparable to the uncompressed text
    if text is None:
        textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                    cachedelta[1])
    else:
        textlen = len(text)
    if d is None or dist > textlen * 2:
        text = buildtext()
        data = self.compress(text)
        l = len(data[1]) + len(data[0])
        base = chainbase = curr

    e = (offset_type(offset, flags), l, textlen,
         base, link, p1r, p2r, node)
    self.index.insert(-1, e)
    self.nodemap[node] = curr

    entry = self._io.packentry(e, self.node, self.version, curr)
    self._writeentry(transaction, ifh, dfh, entry, data, link, offset)

    if type(text) == str: # only accept immutable objects
        self._cache = (node, curr, text)
    self._basecache = (curr, chainbase)
    return node

1233

1229

1234

def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):

1230

def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):

1235

curr = len(self) - 1

1231

curr = len(self) - 1

1236

if not self._inline:

1232

if not self._inline:

1237

transaction.add(self.datafile, offset)

1233

transaction.add(self.datafile, offset)

1238

transaction.add(self.indexfile, curr * len(entry))

1234

transaction.add(self.indexfile, curr * len(entry))

1239

if data[0]:

1235

if data[0]:

1240

dfh.write(data[0])

1236

dfh.write(data[0])

1241

dfh.write(data[1])

1237

dfh.write(data[1])

1242

dfh.flush()

1238

dfh.flush()

1243

ifh.write(entry)

1239

ifh.write(entry)

1244

else:

1240

else:

1245

offset += curr * self._io.size

1241

offset += curr * self._io.size

1246

transaction.add(self.indexfile, offset, curr)

1242

transaction.add(self.indexfile, offset, curr)

1247

ifh.write(entry)

1243

ifh.write(entry)

1248

ifh.write(data[0])

1244

ifh.write(data[0])

1249

ifh.write(data[1])

1245

ifh.write(data[1])

1250

self.checkinlinesize(transaction, ifh)

1246

self.checkinlinesize(transaction, ifh)

1251

1247

1252

def addgroup(self, bundle, linkmapper, transaction):
    """
    add a delta group

    Delta chunks are read from bundle.deltachunk() until it returns an
    empty value. Each chunk whose node is not already known is added
    through _addrevision() using the chunk's delta and delta base;
    linkmapper converts the chunk's 'cs' value into a linkrev.

    Returns the list of nodes read from the bundle, including those
    that were already present.

    Raises LookupError when a parent or the delta base of a new chunk
    is not in the nodemap.
    """
    # nodes seen in the bundle, in order
    content = []
    node = None

    nrevs = len(self)
    if nrevs:
        dataend = self.end(nrevs - 1)
    else:
        dataend = 0
    ifh = self.opener(self.indexfile, "a+")
    indexsize = nrevs * self._io.size
    if self._inline:
        transaction.add(self.indexfile, dataend + indexsize, nrevs)
        dfh = None
    else:
        transaction.add(self.indexfile, indexsize, nrevs)
        transaction.add(self.datafile, dataend)
        dfh = self.opener(self.datafile, "a")

    try:
        # loop through our set of deltas
        chain = None
        while True:
            chunkdata = bundle.deltachunk(chain)
            if not chunkdata:
                break
            node = chunkdata['node']
            p1 = chunkdata['p1']
            p2 = chunkdata['p2']
            cs = chunkdata['cs']
            deltabase = chunkdata['deltabase']
            delta = chunkdata['delta']

            content.append(node)

            link = linkmapper(cs)
            if node in self.nodemap:
                # this can happen if two branches make the same change
                chain = node
                continue

            for parent in (p1, p2):
                if parent not in self.nodemap:
                    raise LookupError(parent, self.indexfile,
                                      _('unknown parent'))

            if deltabase not in self.nodemap:
                raise LookupError(deltabase, self.indexfile,
                                  _('unknown delta base'))

            cachedelta = (self.rev(deltabase), delta)
            chain = self._addrevision(node, None, transaction, link,
                                      p1, p2, cachedelta, ifh, dfh)
            if not dfh and not self._inline:
                # addrevision switched from inline to conventional
                # reopen the index
                ifh.close()
                dfh = self.opener(self.datafile, "a")
                ifh = self.opener(self.indexfile, "a")
    finally:
        if dfh:
            dfh.close()
        ifh.close()

    return content

1325

1321

1326

def getstrippoint(self, minlink):
    """find the minimum rev that must be stripped to strip the linkrev

    Returns a tuple containing the minimum rev and a set of all revs that
    have linkrevs that will be broken by this strip.
    """
    strippoint = len(self)
    brokenrevs = set()

    # rev -> linkrev for the current frontier of the walk
    heads = {}
    # linkrevs >= minlink that are still waiting to be visited
    pending = set()
    for head in self.headrevs():
        headlinkrev = self.linkrev(head)
        heads[head] = headlinkrev
        if headlinkrev >= minlink:
            pending.add(headlinkrev)

    # This algorithm involves walking down the rev graph, starting at the
    # heads. Since the revs are topologically sorted according to linkrev,
    # once all head linkrevs are below the minlink, we know there are
    # no more revs that could have a linkrev greater than minlink.
    # So we can stop walking.
    while pending:
        strippoint -= 1
        linkrev = heads.pop(strippoint)

        if linkrev >= minlink:
            pending.remove(linkrev)
        else:
            brokenrevs.add(strippoint)

        for parent in self.parentrevs(strippoint):
            if parent == nullrev:
                continue
            parentlinkrev = self.linkrev(parent)
            heads[parent] = parentlinkrev
            if parentlinkrev >= minlink:
                pending.add(parentlinkrev)

    return strippoint, brokenrevs

1365

1361

1366

def strip(self, minlink, transaction):
    """truncate the revlog on the first revision with a linkrev >= minlink

    This function is called when we're stripping revision minlink and
    its descendants from the repository.

    We have to remove all revisions with linkrev >= minlink, because
    the equivalent changelog revisions will be renumbered after the
    strip.

    So we truncate the revlog on the first of these revisions, and
    trust that the caller has saved the revisions that shouldn't be
    removed and that it'll re-add them after this truncation.
    """
    total = len(self)
    if total == 0:
        return

    rev, brokenrevs = self.getstrippoint(minlink)
    if rev == total:
        return

    # first truncate the files on disk
    dataend = self.start(rev)
    indexend = rev * self._io.size
    if self._inline:
        # inline data lives in the index file, after the entries
        indexend += dataend
    else:
        transaction.add(self.datafile, dataend)

    transaction.add(self.indexfile, indexend)

    # then reset internal state in memory to forget those revisions
    self._cache = None
    self._chunkclear()
    for stripped in xrange(rev, total):
        del self.nodemap[self.node(stripped)]

    del self.index[rev:-1]

1404

1400

1405

def checksize(self):

1401

def checksize(self):

1406

expected = 0

1402

expected = 0

1407

if len(self):

1403

if len(self):

1408

expected = max(0, self.end(len(self) - 1))

1404

expected = max(0, self.end(len(self) - 1))

1409

1405

1410

try:

1406

try:

1411

f = self.opener(self.datafile)

1407

f = self.opener(self.datafile)

1412

f.seek(0, 2)

1408

f.seek(0, 2)

1413

actual = f.tell()

1409

actual = f.tell()

1414

f.close()

1410

f.close()

1415

dd = actual - expected

1411

dd = actual - expected

1416

except IOError, inst:

1412

except IOError, inst:

1417

if inst.errno != errno.ENOENT:

1413

if inst.errno != errno.ENOENT:

1418

raise

1414

raise

1419

dd = 0

1415

dd = 0

1420

1416

1421

try:

1417

try:

1422

f = self.opener(self.indexfile)

1418

f = self.opener(self.indexfile)

1423

f.seek(0, 2)

1419

f.seek(0, 2)

1424

actual = f.tell()

1420

actual = f.tell()

1425

f.close()

1421

f.close()

1426

s = self._io.size

1422

s = self._io.size

1427

i = max(0, actual // s)

1423

i = max(0, actual // s)

1428

di = actual - (i * s)

1424

di = actual - (i * s)

1429

if self._inline:

1425

if self._inline:

1430

databytes = 0

1426

databytes = 0

1431

for r in self:

1427

for r in self:

1432

databytes += max(0, self.length(r))

1428

databytes += max(0, self.length(r))

1433

dd = 0

1429

dd = 0

1434

di = actual - len(self) * s - databytes

1430

di = actual - len(self) * s - databytes

1435

except IOError, inst:

1431

except IOError, inst:

1436

if inst.errno != errno.ENOENT:

1432

if inst.errno != errno.ENOENT:

1437

raise

1433

raise

1438

di = 0

1434

di = 0

1439

1435

1440

return (dd, di)

1436

return (dd, di)

1441

1437

1442

def files(self):
    """Return the list of file names backing this revlog.

    The index file always comes first; the data file is included only
    when the revlog is not inline.
    """
    if self._inline:
        return [self.indexfile]
    return [self.indexfile, self.datafile]

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # revlog.py - storage back-end for mercurial
             #
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             # import stuff from node for others to import from revlog
             from node import bin, hex, nullid, nullrev
             from i18n import _
             import ancestor, mdiff, parsers, error, util, templatefilters
             import struct, zlib, errno
             # module-level aliases for frequently used library functions
             _pack = struct.pack
             _unpack = struct.unpack
             _compress = zlib.compress
             _decompress = zlib.decompress
             _sha = util.sha1
             # revlog header flags
             # The version word keeps the format number in its low 16 bits and
             # feature flags in the bits above (revlog.__init__ splits it with
             # 0xFFFF / ~0xFFFF).
             REVLOGV0 = 0
             REVLOGNG = 1
             REVLOGNGINLINEDATA = (1 << 16)
             REVLOGGENERALDELTA = (1 << 17)
             REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
             REVLOG_DEFAULT_FORMAT = REVLOGNG
             REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
             # every header flag that is accepted together with the REVLOGNG format
             REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGGENERALDELTA
             # revlog index flags
             REVIDX_KNOWN_FLAGS = 0
             # max size of revlog with inline data
             _maxinline = 131072  # == 1 << 17
             _chunksize = 1048576  # == 1 << 20
             # re-export the error classes under local names
             RevlogError = error.RevlogError
             LookupError = error.LookupError
             def getoffset(q):
                 """Return the part of packed value q above its low 16 bits."""
                 shifted = q >> 16
                 return int(shifted)
             def gettype(q):
                 """Return the low 16 bits of packed value q."""
                 lowbits = q & 0xFFFF
                 return int(lowbits)
             def offset_type(offset, type):
                 return long(long(offset) << 16 | type)
             # hash object pre-fed with nullid; hash() copies it instead of rebuilding
             nullhash = _sha(nullid)
             def hash(text, p1, p2):
                 """Return the digest identifying text together with its two parents.

                 The digest covers the parent hashes as well as the contents, so
                 identical contents with different history get different nodes.
                 """
                 if p2 != nullid:
                     # neither parent is expected to be nullid here (when one
                     # parent is null it is p2); feed them in sorted order
                     first, second = sorted([p1, p2])
                     s = _sha(first)
                     s.update(second)
                 else:
                     # copying the pre-fed hash is faster than creating one
                     s = nullhash.copy()
                     s.update(p1)
                 s.update(text)
                 return s.digest()
             def decompress(bin):
                 """Return the payload of a stored chunk, dispatching on its first byte.

                 Empty input and chunks starting with '\\0' are returned unchanged,
                 'u' chunks are returned without that marker byte, and 'x' chunks
                 are passed whole to zlib.  Raises RevlogError for any other
                 marker or when zlib reports an error.
                 """
                 if not bin:
                     return bin
                 marker = bin[0]
                 if marker == '\0':
                     return bin
                 if marker == 'u':
                     return bin[1:]
                 if marker != 'x':
                     raise RevlogError(_("unknown compression type %r") % marker)
                 try:
                     return _decompress(bin)
                 except zlib.error, e:
                     raise RevlogError(_("revlog decompress error: %s") % str(e))
             # index v0:
             #  4 bytes: offset
             #  4 bytes: compressed length
             #  4 bytes: base rev
             #  4 bytes: link rev
             # 20 bytes: parent 1 nodeid
             # 20 bytes: parent 2 nodeid
             # 20 bytes: nodeid
             # struct layout: big-endian, four 4-byte signed ints followed by three
             # 20-byte strings (76 bytes per record)
             indexformatv0 = ">4l20s20s20s"
             # 56 == 4 * 4 + 20 + 20: byte position of the last 20s field in a record
             v0shaoffset = 56
             class revlogoldio(object):
                 """Reader/writer for index records laid out as indexformatv0."""
                 def __init__(self):
                     self.size = struct.calcsize(indexformatv0)
                 def parseindex(self, data, inline):
                     """Parse v0 index data into (index, nodemap, None).

                     Every complete record is converted to the 8-field revlogv1
                     tuple (parent nodeids become revision numbers, uncompressed
                     length is -1); trailing partial records are ignored.
                     """
                     recsize = self.size
                     entries = []
                     nodemap = {nullid: nullrev}
                     # start position of every complete record in data
                     starts = xrange(0, len(data) - recsize + 1, recsize)
                     for rev, pos in enumerate(starts):
                         record = _unpack(indexformatv0, data[pos:pos + recsize])
                         offset, complen, base, link, p1node, p2node, nodeid = record
                         # transform to revlogv1 format
                         entries.append((offset_type(offset, 0), complen, -1,
                                         base, link,
                                         nodemap.get(p1node, nullrev),
                                         nodemap.get(p2node, nullrev),
                                         nodeid))
                         nodemap[nodeid] = rev
                     # add the magic null revision at -1
                     entries.append((0, 0, 0, -1, -1, -1, -1, nullid))
                     return entries, nodemap, None
                 def packentry(self, entry, node, version, rev):
                     """Serialize a revlogv1-style entry as a v0 record.

                     node is a callable mapping a parent revision number to its
                     nodeid.  Raises RevlogError when the entry carries flags.
                     """
                     offset_flags = entry[0]
                     if gettype(offset_flags):
                         raise RevlogError(_("index entry flags need RevlogNG"))
                     fields = [getoffset(offset_flags), entry[1], entry[3], entry[4]]
                     fields.append(node(entry[5]))
                     fields.append(node(entry[6]))
                     fields.append(entry[7])
                     return _pack(indexformatv0, *fields)
             # index ng:
             #  6 bytes: offset
             #  2 bytes: flags
             #  4 bytes: compressed length
             #  4 bytes: uncompressed length
             #  4 bytes: base rev
             #  4 bytes: link rev
             #  4 bytes: parent 1 rev
             #  4 bytes: parent 2 rev
             # 32 bytes: nodeid
             # struct layout: big-endian, one 8-byte unsigned int, six 4-byte signed
             # ints, a 20-byte string and 12 pad bytes (64 bytes per record)
             indexformatng = ">Qiiiiii20s12x"
             # 32 == 8 + 6 * 4: byte position of the 20s field in a record
             ngshaoffset = 32
             # big-endian unsigned 32-bit int; revlogio.packentry writes it over the
             # first 4 bytes of revision 0 and revlog.__init__ reads it back
             versionformat = ">I"
             class revlogio(object):
                 """Reader/writer for index records laid out as indexformatng."""
                 def __init__(self):
                     self.size = struct.calcsize(indexformatng)
                 def parseindex(self, data, inline):
                     """Parse index data and return (index, nodemap or None, cache)."""
                     # call the C implementation to parse the index data
                     parsed = parsers.parse_index2(data, inline)
                     index, cache = parsed
                     nodemap = getattr(index, 'nodemap', None)
                     return index, nodemap, cache
                 def packentry(self, entry, node, version, rev):
                     """Serialize entry; for revision 0 the first 4 bytes hold version."""
                     packed = _pack(indexformatng, *entry)
                     if rev != 0:
                         return packed
                     return _pack(versionformat, version) + packed[4:]
             class revlog(object):
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 """
                 def __init__(self, opener, indexfile):
                     """
                     create a revlog object
                     opener is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like.
                     indexfile is the name of the index file; the data file name is
                     derived from it.

                     Raises RevlogError for an invalid chunk cache size, an unknown
                     format or flag combination, or an index that fails to parse.
                     """
                     self.indexfile = indexfile
                     # data file name: the last two characters of the index name
                     # are replaced by ".d"
                     self.datafile = indexfile[:-2] + ".d"
                     self.opener = opener
                     self._cache = None
                     self._basecache = None
                     self._chunkcache = (0, '')
                     self._chunkcachesize = 65536
                     self.index = []
                     self._pcache = {}
                     # node -> rev cache and the position where rev() resumes its
                     # backwards scan of the index
                     self._nodecache = {nullid: nullrev}
                     self._nodepos = None
                     # version used when the index file is missing or empty
                     v = REVLOG_DEFAULT_VERSION
                     opts = getattr(opener, 'options', None)
                     if opts is not None:
                         if 'revlogv1' in opts:
                             if 'generaldelta' in opts:
                                 v |= REVLOGGENERALDELTA
                         else:
                             # options present but without 'revlogv1': use v0
                             v = 0
                         if 'chunkcachesize' in opts:
                             self._chunkcachesize = opts['chunkcachesize']
                     if self._chunkcachesize <= 0:
                         raise RevlogError(_('revlog chunk cache size %r is not greater '
                                             'than 0') % self._chunkcachesize)
                     # x & (x - 1) is non-zero unless x is a power of two
                     elif self._chunkcachesize & (self._chunkcachesize - 1):
                         raise RevlogError(_('revlog chunk cache size %r is not a power '
                                             'of 2') % self._chunkcachesize)
                     i = ''
                     self._initempty = True
                     try:
                         f = self.opener(self.indexfile)
                         i = f.read()
                         f.close()
                         if len(i) > 0:
                             # the first 4 bytes of a non-empty index hold the version
                             # NOTE(review): with 1-3 bytes of data struct.unpack
                             # raises struct.error, which is not caught below --
                             # confirm whether that should become a RevlogError
                             v = struct.unpack(versionformat, i[:4])[0]
                             self._initempty = False
                     except IOError, inst:
                         # a missing index file is treated as an empty revlog
                         if inst.errno != errno.ENOENT:
                             raise
                     self.version = v
                     self._inline = v & REVLOGNGINLINEDATA
                     self._generaldelta = v & REVLOGGENERALDELTA
                     # high bits carry feature flags, low 16 bits the format number
                     flags = v & ~0xFFFF
                     fmt = v & 0xFFFF
                     if fmt == REVLOGV0 and flags:
                         raise RevlogError(_("index %s unknown flags %#04x for format v0")
                                           % (self.indexfile, flags >> 16))
                     elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
                         raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                                           % (self.indexfile, flags >> 16))
                     elif fmt > REVLOGNG:
                         raise RevlogError(_("index %s unknown format %d")
                                           % (self.indexfile, fmt))
                     # pick the index parser/packer matching the on-disk format
                     self._io = revlogio()
                     if self.version == REVLOGV0:
                         self._io = revlogoldio()
                     try:
                         d = self._io.parseindex(i, self._inline)
                     except (ValueError, IndexError):
                         raise RevlogError(_("index %s is corrupted") % (self.indexfile))
                     self.index, nodemap, self._chunkcache = d
                     if nodemap is not None:
                         # the parser supplied a node map: use it as the node cache
                         self.nodemap = self._nodecache = nodemap
                     if not self._chunkcache:
                         self._chunkclear()
                 def tip(self):
                     return self.node(len(self.index) - 2)
                 def __len__(self):
                     return len(self.index) - 1
                 def __iter__(self):
                     return iter(xrange(len(self)))
                 def revs(self, start=0, stop=None):
                     """iterate over all rev in this revlog (from start to stop)"""
                     step = 1
                     if stop is not None:
                         if start > stop:
                             step = -1
                         stop += step
                     else:
                         stop = len(self)
                     return xrange(start, stop, step)
                 @util.propertycache
                 def nodemap(self):
                     """Return the node cache after looking up the node of revision 0."""
                     # looking up the first node makes rev() walk the index down to
                     # revision 0 when it has to fall back to its scan
                     firstnode = self.node(0)
                     self.rev(firstnode)
                     return self._nodecache
                 def hasnode(self, node):
                     try:
                         self.rev(node)
                         return True
                     except KeyError:
                         return False
                 def clearcaches(self):
                     try:
                         self._nodecache.clearcaches()
                     except AttributeError:
                         self._nodecache = {nullid: nullrev}
                         self._nodepos = None
                 def rev(self, node):
                     try:
                         return self._nodecache[node]
                     except RevlogError:
                         # parsers.c radix tree lookup failed
                         raise LookupError(node, self.indexfile, _('no node'))
                     except KeyError:
                         # pure python cache lookup failed
                         n = self._nodecache
                         i = self.index
                         p = self._nodepos
                         if p is None:
                             p = len(i) - 2
                         for r in xrange(p, -1, -1):
                             v = i[r][7]
                             n[v] = r
                             if v == node:
                                 self._nodepos = r - 1
                                 return r
                         raise LookupError(node, self.indexfile, _('no node'))
                 def node(self, rev):
                     return self.index[rev][7]
                 def linkrev(self, rev):
                     return self.index[rev][4]
                 def parents(self, node):
                     i = self.index
                     d = i[self.rev(node)]
                     return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
                 def parentrevs(self, rev):
                     return self.index[rev][5:7]
                 def start(self, rev):
                     return int(self.index[rev][0] >> 16)
                 def end(self, rev):
                     return self.start(rev) + self.length(rev)
                 def length(self, rev):
                     return self.index[rev][1]
                 def chainbase(self, rev):
                     index = self.index
                     base = index[rev][3]
                     while base != rev:
                         rev = base
                         base = index[rev][3]
                     return base
                 def flags(self, rev):
                     return self.index[rev][0] & 0xFFFF
                 def rawsize(self, rev):
                     """return the length of the uncompressed text for a given revision"""
                     l = self.index[rev][2]
                     if l >= 0:
                         return l
                     t = self.revision(self.node(rev))
                     return len(t)
                 size = rawsize
                 def ancestors(self, revs, stoprev=0, inclusive=False):
                     """Generate the ancestors of 'revs' in reverse topological order.
                     Does not generate revs lower than stoprev.

                     This is a thin wrapper: see the documentation for
                     ancestor.lazyancestors for more details."""
                     lazy = ancestor.lazyancestors(self, revs, stoprev=stoprev,
                                                   inclusive=inclusive)
                     return lazy
                 def descendants(self, revs):
                     """Generate the descendants of 'revs' in revision order.
                     Yield a sequence of revision numbers starting with a child of
                     some rev in revs, i.e., each revision is *not* considered a
                     descendant of itself.  Results are ordered by revision number (a
                     topological sort)."""
                     first = min(revs)
                     if first == nullrev:
                         for i in self:
                             yield i
                         return
                     seen = set(revs)
                     for i in self.revs(start=first + 1):
                         for x in self.parentrevs(i):
                             if x != nullrev and x in seen:
                                 seen.add(i)
                                 yield i
                                 break
                 def findcommonmissing(self, common=None, heads=None):
                     """Return a tuple of the ancestors of common and the ancestors of heads
                     that are not ancestors of common. In revset terminology, we return the
                     tuple:
                       ::common, (::heads) - (::common)

                     The first element is a lazy set of revision numbers, the
                     second a list of nodes sorted by revision number, meaning it
                     is topologically sorted.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [nullid]
                     if heads is None:
                         heads = self.heads()
                     commonrevs = [self.rev(n) for n in common]
                     headrevs = [self.rev(n) for n in heads]
                     # we want the ancestors, but inclusive
                     class lazyset(object):
                         """Set-like view: explicitly added values plus a lazy collection."""
                         def __init__(self, lazyvalues):
                             self.addedvalues = set()
                             self.lazyvalues = lazyvalues
                         def __contains__(self, value):
                             if value in self.addedvalues:
                                 return True
                             return value in self.lazyvalues
                         def __iter__(self):
                             added = self.addedvalues
                             for r in added:
                                 yield r
                             for r in self.lazyvalues:
                                 if r in added:
                                     # already produced by the first loop
                                     continue
                                 yield r
                         def add(self, value):
                             self.addedvalues.add(value)
                         def update(self, values):
                             self.addedvalues.update(values)
                     has = lazyset(self.ancestors(commonrevs))
                     has.add(nullrev)
                     has.update(commonrevs)
                     # take all ancestors from heads that aren't in has
                     missing = set()
                     pending = util.deque(r for r in headrevs if r not in has)
                     while pending:
                         r = pending.popleft()
                         if r not in missing:
                             missing.add(r)
                             pending.extend(p for p in self.parentrevs(r)
                                            if p not in has)
                     return has, [self.node(r) for r in sorted(missing)]
                 def findmissingrevs(self, common=None, heads=None):
                     """Return the revision numbers of the ancestors of heads that
                     are not ancestors of common.

                     More specifically, return a list of revision numbers corresponding to
                     nodes N such that every N satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The computation is delegated to ancestor.missingancestors.

                     'heads' and 'common' are both lists of revision numbers.  If heads is
                     not supplied, uses all of the revlog's head revisions.  If common is
                     not supplied, uses nullrev."""
                     bases = common
                     if bases is None:
                         bases = [nullrev]
                     tips = heads
                     if tips is None:
                         tips = self.headrevs()
                     return ancestor.missingancestors(tips, bases, self.parentrevs)
                 def findmissing(self, common=None, heads=None):
                     """Return the ancestors of heads that are not ancestors of common.

                     More specifically, return a list of nodes N such that every N
                     satisfies the following constraints:

                       1. N is an ancestor of some node in 'heads'
                       2. N is not an ancestor of any node in 'common'

                     The node IDs are converted to revision numbers, passed to
                     ancestor.missingancestors, and the result is mapped back to nodes.

                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [nullid]
                     if heads is None:
                         heads = self.heads()
                     commonrevs = [self.rev(n) for n in common]
                     headrevs = [self.rev(n) for n in heads]
                     missingrevs = ancestor.missingancestors(headrevs, commonrevs,
                                                             self.parentrevs)
                     return [self.node(r) for r in missingrevs]
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.

                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:

                       1. N is a descendant of some node in 'roots'
                       2. N is an ancestor of some node in 'heads'

                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.

                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.

                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads.

                     An empty 'roots' or 'heads' list, or roots and heads that do
                     not connect, give ([], [], [])."""
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [nullid] # Everybody's a descendant of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return ([self.node(r) for r in self], [nullid], list(self.heads()))
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendant of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n) # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update([p for p in self.parents(n) if
                                                        p != nullid])
                                 elif n in heads: # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [n for n in roots if n in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(n) for n in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [nullid]
                     # Transform our roots list into a set.
                     descendants = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendants.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendants, empty parents will look like
                     # they're descendants.
                     # NOTE(review): revs() already includes its 'stop' argument (it
                     # adds the step to it), so this loop also visits highestrev + 1;
                     # confirm whether stop=highestrev was intended.
                     for r in self.revs(start=max(lowestrev, 0), stop=highestrev + 1):
                         n = self.node(r)
                         isdescendant = False
                         if lowestrev == nullrev:  # Everybody is a descendant of nullid
                             isdescendant = True
                         elif n in descendants:
                             # n is already a descendant
                             isdescendant = True
                             # This check only needs to be done here because all the roots
                             # will start being marked as descendants before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendants, it's not a root.
                                 if (p[0] in descendants) or (p[1] in descendants):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendant if either of its parents are
                             # descendants.  (We seeded the descendants set with the
                             # roots up there, remember?)
                             if (p[0] in descendants) or (p[1] in descendants):
                                 descendants.add(n)
                                 isdescendant = True
                         if isdescendant and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendants and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # keep only the heads that were marked as reached/discovered
                     heads = [n for n, flag in heads.iteritems() if flag]
                     roots = list(roots)
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self):
                     try:
                         return self.index.headrevs()
                     except AttributeError:
                         return self._headrevs()
                 def _headrevs(self):
                     count = len(self)
                     if not count:
                         return [nullrev]
                     # we won't iter over filtered rev so nobody is a head at start
                     ishead = [0] * (count + 1)
                     index = self.index
                     for r in self:
                         ishead[r] = 1  # I may be an head
                         e = index[r]
                         ishead[e[5]] = ishead[e[6]] = 0  # my parent are not
                     return [r for r, val in enumerate(ishead) if val]
                 def heads(self, start=None, stop=None):
                     """return the list of all nodes that have no children

                     start - when given, only heads descending from this node are
                         returned
                     stop - when given, the listed nodes are treated as if they had
                         no children
                     """
                     if start is None and stop is None:
                         if len(self) == 0:
                             return [nullid]
                         return [self.node(rev) for rev in self.headrevs()]
                     if start is None:
                         start = nullid
                     stopnodes = [] if stop is None else stop
                     barrier = set(self.rev(n) for n in stopnodes)
                     first = self.rev(start)
                     seen = set([first])
                     tips = set([first])
                     getparents = self.parentrevs
                     for rev in self.revs(start=first + 1):
                         for parent in getparents(rev):
                             if parent in seen:
                                 # rev descends from start; do not walk past a
                                 # stop revision, but still report it as a head
                                 if rev not in barrier:
                                     seen.add(rev)
                                 tips.add(rev)
                             if parent in tips and parent not in barrier:
                                 tips.remove(parent)
                     return [self.node(rev) for rev in tips]
                 def children(self, node):
                     """find the children of a given node

                     Only revisions numbered after ``node`` are inspected.  A revision
                     with no non-null parent counts as a child of the null revision.
                     """
                     found = []
                     target = self.rev(node)
                     for rev in self.revs(start=target + 1):
                         realparents = [pr for pr in self.parentrevs(rev)
                                        if pr != nullrev]
                         if not realparents:
                             if target == nullrev:
                                 found.append(self.node(rev))
                             continue
                         found.extend(self.node(rev) for pr in realparents
                                      if pr == target)
                     return found
                 def descendant(self, start, end):
                     """return True if revision ``end`` descends from revision ``start``

                     Every revision is treated as a descendant of the null revision.
                     The walk stops at the first descendant numbered above ``end``
                     (presumably self.descendants yields ascending revs - confirm).
                     """
                     if start == nullrev:
                         return True
                     for rev in self.descendants([start]):
                         if rev == end:
                             return True
                         if rev > end:
                             return False
                     return False
                 def commonancestorsheads(self, a, b):
                     """calculate all the heads of the common ancestors of nodes a and b

                     Both arguments and the returned items are nodes; the computation
                     itself is done on revision numbers.
                     """
                     reva = self.rev(a)
                     revb = self.rev(b)
                     try:
                         headrevs = self.index.commonancestorsheads(reva, revb)
                     except (AttributeError, OverflowError):
                         # the C implementation is missing or failed; use the
                         # ancestor module instead
                         headrevs = ancestor.commonancestorsheads(self.parentrevs,
                                                                  reva, revb)
                     return map(self.node, headrevs)
-                def commonancestors(self, a, b):
+                def ancestor(self, a, b):
-                    """calculate the least common ancestors of nodes a and b"""
+                    """calculate the least common ancestor of nodes a and b"""
                     a, b = self.rev(a), self.rev(b)
                     try:
                         ancs = self.index.ancestors(a, b)
-                    except (AttributeError, OverflowError): # C implementation failed
+                    except (AttributeError, OverflowError):
                         ancs = ancestor.ancestors(self.parentrevs, a, b)
-                    return map(self.node, ancs)
-                def ancestor(self, a, b):
-                    """calculate a least common ancestor of nodes a and b"""
-                    ancs = self.commonancestors(a, b)
                     if ancs:
                         # choose a consistent winner when there's a tie
-                        return min(ancs)
+                        return min(map(self.node, ancs))
                     return nullid
                 def _match(self, id):
                     if isinstance(id, int):
                         # rev
                         return self.node(id)
                     if len(id) == 20:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             node = id
                             self.rev(node) # quick search the index
                             return node
                         except LookupError:
                             pass # may be partial hex id
                     try:
                         # str(rev)
                         rev = int(id)
                         if str(rev) != id:
                             raise ValueError
                         if rev < 0:
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 40:
                         try:
                             # a full hex nodeid?
                             node = bin(id)
                             self.rev(node)
                             return node
                         except (TypeError, LookupError):
                             pass
                 def _partialmatch(self, id):
                     try:
                         n = self.index.partialmatch(id)
                         if n and self.hasnode(n):
                             return n
                         return None
                     except RevlogError:
                         # parsers.c radix tree lookup gave multiple matches
                         # fall through to slow path that filters hidden revisions
                         pass
                     except (AttributeError, ValueError):
                         # we are pure python, or key was too short to search radix tree
                         pass
                     if id in self._pcache:
                         return self._pcache[id]
                     if len(id) < 40:
                         try:
                             # hex(node)[:...]
                             l = len(id) // 2  # grab an even number of digits
                             prefix = bin(id[:l * 2])
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             nl = [n for n in nl if hex(n).startswith(id) and
                                   self.hasnode(n)]
                             if len(nl) > 0:
                                 if len(nl) == 1:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise LookupError(id, self.indexfile,
                                                   _('ambiguous identifier'))
                             return None
                         except TypeError:
                             pass
                 def lookup(self, id):
                     """locate a node based on:
                         - revision number or str(revision number)
                         - nodeid or subset of hex nodeid

                     Raises LookupError when neither an exact nor a partial match is
                     found.
                     """
                     exact = self._match(id)
                     if exact is not None:
                         return exact
                     partial = self._partialmatch(id)
                     if not partial:
                         raise LookupError(id, self.indexfile, _('no match found'))
                     return partial
                 def cmp(self, node, text):
                     """compare text with a given file revision

                     returns True if text is different than what is stored.

                     The stored text is never read: text is hashed together with the
                     parents of node and the result is compared with node itself.
                     """
                     parent1, parent2 = self.parents(node)
                     expected = hash(text, parent1, parent2)
                     return expected != node
                 def _addchunk(self, offset, data):
                     o, d = self._chunkcache
                     # try to add to existing cache
                     if o + len(d) == offset and len(d) + len(data) < _chunksize:
                         self._chunkcache = o, d + data
                     else:
                         self._chunkcache = offset, data
                 def _loadchunk(self, offset, length):
                     if self._inline:
                         df = self.opener(self.indexfile)
                     else:
                         df = self.opener(self.datafile)
                     # Cache data both forward and backward around the requested
                     # data, in a fixed size window. This helps speed up operations
                     # involving reading the revlog backwards.
                     cachesize = self._chunkcachesize
                     realoffset = offset & ~(cachesize - 1)
                     reallength = (((offset + length + cachesize) & ~(cachesize - 1))
                                   - realoffset)
                     df.seek(realoffset)
                     d = df.read(reallength)
                     df.close()
                     self._addchunk(realoffset, d)
                     if offset != realoffset or reallength != length:
                         return util.buffer(d, offset - realoffset, length)
                     return d
                 def _getchunk(self, offset, length):
                     o, d = self._chunkcache
                     l = len(d)
                     # is it in the cache?
                     cachestart = offset - o
                     cacheend = cachestart + length
                     if cachestart >= 0 and cacheend <= l:
                         if cachestart == 0 and cacheend == l:
                             return d # avoid a copy
                         return util.buffer(d, cachestart, cacheend - cachestart)
                     return self._loadchunk(offset, length)
                 def _chunkraw(self, startrev, endrev):
                     start = self.start(startrev)
                     end = self.end(endrev)
                     if self._inline:
                         start += (startrev + 1) * self._io.size
                         end += (endrev + 1) * self._io.size
                     length = end - start
                     return self._getchunk(start, length)
                 def _chunk(self, rev):
                     """return the decompressed stored chunk of a single revision"""
                     raw = self._chunkraw(rev, rev)
                     return decompress(raw)
                 def _chunks(self, revs):
                     '''faster version of [self._chunk(rev) for rev in revs]
                     Assumes that revs is in ascending order.'''
                     if not revs:
                         return []
                     start = self.start
                     length = self.length
                     inline = self._inline
                     iosize = self._io.size
                     buffer = util.buffer
                     l = []
                     ladd = l.append
                     # preload the cache
                     try:
                         self._chunkraw(revs[0], revs[-1])
                         offset, data = self._chunkcache
                     except OverflowError:
                         # issue4215 - we can't cache a run of chunks greater than
                         # 2G on Windows
                         return [self._chunk(rev) for rev in revs]
                     for rev in revs:
                         chunkstart = start(rev)
                         if inline:
                             chunkstart += (rev + 1) * iosize
                         chunklength = length(rev)
                         ladd(decompress(buffer(data, chunkstart - offset, chunklength)))
                     return l
                 def _chunkclear(self):
                     self._chunkcache = (0, '')
                 def deltaparent(self, rev):
                     """return deltaparent of the given revision

                     nullrev is returned when the index entry names rev as its own
                     base.  Otherwise the answer is the recorded base for generaldelta
                     revlogs and the previous revision for all others.
                     """
                     base = self.index[rev][3]
                     if base == rev:
                         return nullrev
                     if self._generaldelta:
                         return base
                     return rev - 1
                 def revdiff(self, rev1, rev2):
                     """return or calculate a delta between two revisions

                     The stored chunk of rev2 is returned directly when rev2 is
                     stored as a delta against rev1; otherwise both texts are rebuilt
                     and diffed.
                     """
                     storedasdelta = (rev1 != nullrev and
                                      self.deltaparent(rev2) == rev1)
                     if not storedasdelta:
                         return mdiff.textdiff(self.revision(rev1),
                                               self.revision(rev2))
                     return str(self._chunk(rev2))
                 def revision(self, nodeorrev):
                     """return an uncompressed revision of a given node or revision
                     number.

                     nodeorrev - an int is taken as a revision number, anything else
                         as a node

                     The null node yields the empty string.  The text is rebuilt by
                     applying the revision's delta chain, verified with _checkhash and
                     remembered in self._cache as (node, rev, text).  Raises
                     RevlogError when the revision carries flags outside
                     REVIDX_KNOWN_FLAGS.
                     """
                     if isinstance(nodeorrev, int):
                         rev = nodeorrev
                         node = self.node(rev)
                     else:
                         node = nodeorrev
                         # resolved lazily below, only if the cache misses
                         rev = None
                     cachedrev = None
                     if node == nullid:
                         return ""
                     if self._cache:
                         if self._cache[0] == node:
                             # exact hit: the cached text is the answer
                             return self._cache[2]
                         # remember the cached rev; the chain walk may reach it
                         cachedrev = self._cache[1]
                     # look up what we need to read
                     text = None
                     if rev is None:
                         rev = self.rev(node)
                     # check rev flags
                     if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
                         raise RevlogError(_('incompatible revision flag %x') %
                                           (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))
                     # build delta chain
                     chain = []
                     index = self.index # for performance
                     generaldelta = self._generaldelta
                     iterrev = rev
                     e = index[iterrev]
                     # walk back until an entry that is its own base (e[3]) or the
                     # cached revision is reached
                     while iterrev != e[3] and iterrev != cachedrev:
                         chain.append(iterrev)
                         if generaldelta:
                             # the base field names the delta parent directly
                             iterrev = e[3]
                         else:
                             # deltas are always against the previous revision
                             iterrev -= 1
                         e = index[iterrev]
                     if iterrev == cachedrev:
                         # cache hit
                         text = self._cache[2]
                     else:
                         # the chain base itself has to be read as well
                         chain.append(iterrev)
                     chain.reverse()
                     # drop cache to save memory
                     self._cache = None
                     bins = self._chunks(chain)
                     if text is None:
                         # no cached starting text: the first chunk is the base text
                         text = str(bins[0])
                         bins = bins[1:]
                     text = mdiff.patches(text, bins)
                     text = self._checkhash(text, node, rev)
                     self._cache = (node, rev, text)
                     return text
                 def _checkhash(self, text, node, rev):
                     p1, p2 = self.parents(node)
                     self.checkhash(text, p1, p2, node, rev)
                     return text
                 def checkhash(self, text, p1, p2, node, rev=None):
                     """raise RevlogError unless node equals hash(text, p1, p2)

                     The error message names the index file and rev, or the short hex
                     form of node when rev is None.
                     """
                     if node == hash(text, p1, p2):
                         return
                     label = rev
                     if label is None:
                         label = templatefilters.short(hex(node))
                     raise RevlogError(_("integrity check failed on %s:%s")
                         % (self.indexfile, label))
                 def checkinlinesize(self, tr, fp=None):
                     """split an inline revlog into separate index and data files

                     tr - the transaction; it must already track the index file
                     fp - optional open handle on the index file, flushed and closed
                         before the files are rewritten

                     Does nothing unless the revlog is inline and the position computed
                     from entry -2 has reached _maxinline.  Raises RevlogError when the
                     index file is not part of the transaction.
                     """
                     # entry -2 is presumably the last real revision (the index seems
                     # to end with a sentinel entry) - confirm
                     if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
                         return
                     trinfo = tr.find(self.indexfile)
                     if trinfo is None:
                         raise RevlogError(_("%s not found in the transaction")
                                           % self.indexfile)
                     trindex = trinfo[2]
                     dataoff = self.start(trindex)
                     # register the new data file with the transaction
                     tr.add(self.datafile, dataoff)
                     if fp:
                         fp.flush()
                         fp.close()
                     # copy the raw chunk of every revision into the data file
                     df = self.opener(self.datafile, 'w')
                     try:
                         for r in self:
                             df.write(self._chunkraw(r, r))
                     finally:
                         df.close()
                     fp = self.opener(self.indexfile, 'w', atomictemp=True)
                     # from here on the revlog is no longer inline; the index entries
                     # are repacked with the updated version flags
                     self.version &= ~(REVLOGNGINLINEDATA)
                     self._inline = False
                     for i in self:
                         e = self._io.packentry(self.index[i], self.node, self.version, i)
                         fp.write(e)
                     # if we don't call close, the temp file will never replace the
                     # real index
                     fp.close()
                     tr.replace(self.indexfile, trindex * self._io.size)
                     # cached offsets referred to the inline layout
                     self._chunkclear()
                 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None,
                                 node=None):
                     """add a revision to the log

                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     node - nodeid of revision; typically node is not specified, and it is
                         computed by default as hash(text, p1, p2), however subclasses might
                         use different hashing method (and override checkhash() in such case)

                     Returns the node of the revision.  A node that is already stored
                     is returned without touching any file.  Raises RevlogError when
                     link is nullrev.
                     """
                     if link == nullrev:
                         raise RevlogError(_("attempted to add linkrev -1 to %s")
                                           % self.indexfile)
                     node = node or hash(text, p1, p2)
                     if node in self.nodemap:
                         return node
                     dfh = None
                     ifh = None
                     try:
                         # both files are opened inside the try block so that a
                         # failure to open the index cannot leak the data handle
                         if not self._inline:
                             dfh = self.opener(self.datafile, "a")
                         ifh = self.opener(self.indexfile, "a+")
                         return self._addrevision(node, text, transaction, link, p1, p2,
                                                  cachedelta, ifh, dfh)
                     finally:
                         if dfh is not None:
                             dfh.close()
                         if ifh is not None:
                             ifh.close()
                 def compress(self, text):
                     """ generate a possibly-compressed representation of text

                     Returns a (header, data) pair.  The header is 'u' when text is
                     kept uncompressed and does not start with a NUL byte; it is empty
                     for compressed data, for empty text and for uncompressed text
                     starting with a NUL byte.  Text shorter than 44 bytes is never
                     compressed.
                     """
                     if not text:
                         return ("", text)
                     size = len(text)
                     packed = None
                     if size >= 44:
                         if size > 1000000:
                             # zlib makes an internal copy, thus doubling memory usage
                             # for large files, so lets do this in pieces
                             z = zlib.compressobj()
                             step = 2**20
                             pieces = [z.compress(text[pos:pos + step])
                                       for pos in range(0, size, step)]
                             pieces.append(z.flush())
                             if sum(map(len, pieces)) < size:
                                 packed = "".join(pieces)
                         else:
                             packed = _compress(text)
                     if packed is not None and len(packed) <= size:
                         return ("", packed)
                     # compression was skipped or did not help: store the text as is
                     if text[0] == '\0':
                         return ("", text)
                     return ('u', text)
                 def _addrevision(self, node, text, transaction, link, p1, p2,
                                  cachedelta, ifh, dfh):
                     """internal function to add revisions to the log
                     see addrevision for argument descriptions.
                     invariants:
                     - text is optional (can be None); if not set, cachedelta must be set.
                       if both are set, they must correspond to each other.

                     ifh, dfh - open handles on the index and data file; dfh is falsy
                         when there is no separate data file to write to

                     The revision is stored as a delta, or as a full text when no delta
                     was built or the delta chain would span more than twice the text
                     length.  Returns node.
                     """
                     # one-element list so that buildtext() can store its result
                     btext = [text]
                     def buildtext():
                         # return the full text, rebuilding it from cachedelta once
                         if btext[0] is not None:
                             return btext[0]
                         # flush any pending writes here so we can read it in revision
                         if dfh:
                             dfh.flush()
                         ifh.flush()
                         basetext = self.revision(self.node(cachedelta[0]))
                         btext[0] = mdiff.patch(basetext, cachedelta[1])
                         self.checkhash(btext[0], p1, p2, node)
                         return btext[0]
                     def builddelta(rev):
                         # build a compressed delta against rev and return
                         # (dist, l, data, base, chainbase)
                         # can we use the cached delta?
                         if cachedelta and cachedelta[0] == rev:
                             delta = cachedelta[1]
                         else:
                             t = buildtext()
                             ptext = self.revision(self.node(rev))
                             delta = mdiff.textdiff(ptext, t)
                         data = self.compress(delta)
                         l = len(data[1]) + len(data[0])
                         if basecache[0] == rev:
                             chainbase = basecache[1]
                         else:
                             chainbase = self.chainbase(rev)
                         # bytes between the start of the chain base and the end of
                         # the new delta
                         dist = l + offset - self.start(chainbase)
                         if self._generaldelta:
                             base = rev
                         else:
                             base = chainbase
                         return dist, l, data, base, chainbase
                     curr = len(self)
                     prev = curr - 1
                     # defaults describe a full-text revision that is its own base
                     base = chainbase = curr
                     offset = self.end(prev)
                     flags = 0
                     d = None
                     if self._basecache is None:
                         self._basecache = (prev, self.chainbase(prev))
                     basecache = self._basecache
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # should we try to build a delta?
                     if prev != nullrev:
                         if self._generaldelta:
                             # prefer a parent that is not older than the cached chain
                             # base, otherwise delta against the previous revision
                             if p1r >= basecache[1]:
                                 d = builddelta(p1r)
                             elif p2r >= basecache[1]:
                                 d = builddelta(p2r)
                             else:
                                 d = builddelta(prev)
                         else:
                             d = builddelta(prev)
                         dist, l, data, base, chainbase = d
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if text is None:
                         textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                                     cachedelta[1])
                     else:
                         textlen = len(text)
                     if d is None or dist > textlen * 2:
                         text = buildtext()
                         data = self.compress(text)
                         l = len(data[1]) + len(data[0])
                         base = chainbase = curr
                     # index entry: (offset and flags, stored length, text length,
                     # base rev, linkrev, p1 rev, p2 rev, node)
                     e = (offset_type(offset, flags), l, textlen,
                          base, link, p1r, p2r, node)
                     # insert before the last index element (presumably a sentinel
                     # entry - confirm)
                     self.index.insert(-1, e)
                     self.nodemap[node] = curr
                     entry = self._io.packentry(e, self.node, self.version, curr)
                     self._writeentry(transaction, ifh, dfh, entry, data, link, offset)
                     if type(text) == str: # only accept immutable objects
                         self._cache = (node, curr, text)
                     self._basecache = (curr, chainbase)
                     return node
                 def _writeentry(self, transaction, ifh, dfh, entry, data, link, offset):
                     curr = len(self) - 1
                     if not self._inline:
                         transaction.add(self.datafile, offset)
                         transaction.add(self.indexfile, curr * len(entry))
                         if data[0]:
                             dfh.write(data[0])
                         dfh.write(data[1])
                         dfh.flush()
                         ifh.write(entry)
                     else:
                         offset += curr * self._io.size
                         transaction.add(self.indexfile, offset, curr)
                         ifh.write(entry)
                         ifh.write(data[0])
                         ifh.write(data[1])
                         self.checkinlinesize(transaction, ifh)
                 def addgroup(self, bundle, linkmapper, transaction):
                     """
                     add a delta group
                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.

                     bundle - source of the deltas, read through deltachunk()
                     linkmapper - called with each chunk's 'cs' value to get the linkrev
                     transaction - the transaction object used for rollback

                     Returns the list of all nodes seen in the group, including the
                     ones that were already stored.  Raises LookupError when a parent
                     or a delta base is unknown.
                     """
                     # track the base of the current delta log
                     content = []
                     node = None
                     r = len(self)
                     end = 0
                     if r:
                         end = self.end(r - 1)
                     ifh = self.opener(self.indexfile, "a+")
                     isize = r * self._io.size
                     # register the current file sizes with the transaction
                     if self._inline:
                         transaction.add(self.indexfile, end + isize, r)
                         dfh = None
                     else:
                         transaction.add(self.indexfile, isize, r)
                         transaction.add(self.datafile, end)
                         dfh = self.opener(self.datafile, "a")
                     try:
                         # loop through our set of deltas
                         chain = None
                         while True:
                             # chain is the node handled last (None at first)
                             chunkdata = bundle.deltachunk(chain)
                             if not chunkdata:
                                 break
                             node = chunkdata['node']
                             p1 = chunkdata['p1']
                             p2 = chunkdata['p2']
                             cs = chunkdata['cs']
                             deltabase = chunkdata['deltabase']
                             delta = chunkdata['delta']
                             content.append(node)
                             link = linkmapper(cs)
                             if node in self.nodemap:
                                 # this can happen if two branches make the same change
                                 chain = node
                                 continue
                             for p in (p1, p2):
                                 if p not in self.nodemap:
                                     raise LookupError(p, self.indexfile,
                                                       _('unknown parent'))
                             if deltabase not in self.nodemap:
                                 raise LookupError(deltabase, self.indexfile,
                                                   _('unknown delta base'))
                             baserev = self.rev(deltabase)
                             # no full text is passed, only the delta and its base
                             chain = self._addrevision(node, None, transaction, link,
                                                       p1, p2, (baserev, delta), ifh, dfh)
                             if not dfh and not self._inline:
                                 # addrevision switched from inline to conventional
                                 # reopen the index
                                 ifh.close()
                                 dfh = self.opener(self.datafile, "a")
                                 ifh = self.opener(self.indexfile, "a")
                     finally:
                         if dfh:
                             dfh.close()
                         ifh.close()
                     return content
                 def getstrippoint(self, minlink):
                     """find the minimum rev that must be stripped to strip the linkrev

                     Returns a tuple containing the minimum rev and a set of all revs that
                     have linkrevs that will be broken by this strip.
                     """
                     broken = set()
                     point = len(self)
                     pending = {}
                     toolarge = set()
                     for head in self.headrevs():
                         headlink = self.linkrev(head)
                         pending[head] = headlink
                         if headlink >= minlink:
                             toolarge.add(headlink)
                     # This algorithm involves walking down the rev graph, starting at the
                     # heads. Since the revs are topologically sorted according to linkrev,
                     # once all head linkrevs are below the minlink, we know there are
                     # no more revs that could have a linkrev greater than minlink.
                     # So we can stop walking.
                     while toolarge:
                         point -= 1
                         currentlink = pending.pop(point)
                         if currentlink >= minlink:
                             toolarge.remove(currentlink)
                         else:
                             broken.add(point)
                         for parent in self.parentrevs(point):
                             if parent == nullrev:
                                 continue
                             parentlink = self.linkrev(parent)
                             pending[parent] = parentlink
                             if parentlink >= minlink:
                                 toolarge.add(parentlink)
                     return point, broken
                 def strip(self, minlink, transaction):
                     """truncate the revlog on the first revision with a linkrev >= minlink

                     This function is called when we're stripping revision minlink and
                     its descendants from the repository.

                     We have to remove all revisions with linkrev >= minlink, because
                     the equivalent changelog revisions will be renumbered after the
                     strip.

                     So we truncate the revlog on the first of these revisions, and
                     trust that the caller has saved the revisions that shouldn't be
                     removed and that it'll re-add them after this truncation.
                     """
                     total = len(self)
                     if total == 0:
                         return
                     striprev, brokenrevs = self.getstrippoint(minlink)
                     if striprev == total:
                         return
                     # first truncate the files on disk
                     dataend = self.start(striprev)
                     if self._inline:
                         indexend = dataend + striprev * self._io.size
                     else:
                         transaction.add(self.datafile, dataend)
                         indexend = striprev * self._io.size
                     transaction.add(self.indexfile, indexend)
                     # then reset internal state in memory to forget those revisions
                     self._cache = None
                     self._chunkclear()
                     for rev in xrange(striprev, total):
                         del self.nodemap[self.node(rev)]
                     del self.index[striprev:-1]
                 def checksize(self):
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))
                     try:
                         f = self.opener(self.datafile)
                         f.seek(0, 2)
                         actual = f.tell()
                         f.close()
                         dd = actual - expected
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         dd = 0
                     try:
                         f = self.opener(self.indexfile)
                         f.seek(0, 2)
                         actual = f.tell()
                         f.close()
                         s = self._io.size
                         i = max(0, actual // s)
                         di = actual - (i * s)
                         if self._inline:
                             databytes = 0
                             for r in self:
                                 databytes += max(0, self.length(r))
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         di = 0
                     return (dd, di)
                 def files(self):
                     """Return a list of the file names this revlog is stored in.

                     The index file always comes first; the data file is listed
                     after it only when the revlog is not inline.
                     """
                     if self._inline:
                         return [self.indexfile]
                     return [self.indexfile, self.datafile]