##// END OF EJS Templates
revlog: pass rev to _checkhash
Matt Mackall -
r13276:ba6a6333 default
parent child Browse files
Show More
@@ -1,1261 +1,1261
1 # revlog.py - storage back-end for mercurial
1 # revlog.py - storage back-end for mercurial
2 #
2 #
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 """Storage back-end for Mercurial.
8 """Storage back-end for Mercurial.
9
9
10 This provides efficient delta storage with O(1) retrieve and append
10 This provides efficient delta storage with O(1) retrieve and append
11 and O(changes) merge between branches.
11 and O(changes) merge between branches.
12 """
12 """
13
13
14 # import stuff from node for others to import from revlog
14 # import stuff from node for others to import from revlog
15 from node import bin, hex, nullid, nullrev, short #@UnusedImport
15 from node import bin, hex, nullid, nullrev, short #@UnusedImport
16 from i18n import _
16 from i18n import _
17 import changegroup, ancestor, mdiff, parsers, error, util
17 import changegroup, ancestor, mdiff, parsers, error, util
18 import struct, zlib, errno
18 import struct, zlib, errno
19
19
# local aliases for frequently called struct/zlib/hash entry points
_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog header flags
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOGSHALLOW = (1 << 17)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGSHALLOW

# revlog index flags (stored in the low 16 bits of an index entry's
# first field, see flags() below)
REVIDX_PARENTDELTA = 1
REVIDX_PUNCHED_FLAG = 2
REVIDX_KNOWN_FLAGS = REVIDX_PUNCHED_FLAG | REVIDX_PARENTDELTA

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

# re-export the error types so callers can catch revlog.RevlogError etc.
RevlogError = error.RevlogError
LookupError = error.LookupError
47
47
def getoffset(q):
    """extract the data-file offset from a packed offset/flags field"""
    offset = q >> 16
    return int(offset)
50
50
def gettype(q):
    """extract the 16-bit flags from a packed offset/flags field"""
    flags = q & 0xFFFF
    return int(flags)
53
53
def offset_type(offset, type):
    # pack a data-file offset and a 16-bit type/flags field into a single
    # integer; the explicit long() calls force a Python 2 long result so
    # the packed value has a consistent type regardless of magnitude
    return long(long(offset) << 16 | type)
56
56
# sha1 state pre-seeded with the null node; hash() below copies it for
# the common case where p2 is nullid, which is cheaper than re-hashing
nullhash = _sha(nullid)
58
58
def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    # As of now, if one of the parent node is null, p2 is null
    if p2 != nullid:
        # neither parent is nullid: hash the sorted parent pair
        pmin, pmax = sorted([p1, p2])
        s = _sha(pmin)
        s.update(pmax)
    else:
        # copying the precomputed null-seeded hash is faster than
        # creating a fresh one
        s = nullhash.copy()
        s.update(p1)
    s.update(text)
    return s.digest()
79
79
def compress(text):
    """ generate a possibly-compressed representation of text """
    if not text:
        return ("", text)
    size = len(text)
    compressed = None
    if size >= 44:
        # below 44 bytes compression can never win, so don't bother
        if size <= 1000000:
            compressed = _compress(text)
        else:
            # zlib makes an internal copy, thus doubling memory usage for
            # large files, so lets do this in pieces
            z = zlib.compressobj()
            pieces = []
            offset = 0
            while offset < size:
                pieces.append(z.compress(text[offset:offset + 2**20]))
                offset += 2**20
            pieces.append(z.flush())
            # only keep the compressed form if it is actually smaller
            if sum(map(len, pieces)) < size:
                compressed = "".join(pieces)
    if compressed is None or len(compressed) > size:
        # store uncompressed; text already starting with '\0' needs no
        # marker byte, anything else gets a 'u' (uncompressed) prefix
        if text[0] == '\0':
            return ("", text)
        return ('u', text)
    return ("", compressed)
108
108
def decompress(bin):
    """ decompress the given input """
    if not bin:
        return bin
    marker = bin[0]
    if marker == '\0':
        # '\0'-prefixed data is stored verbatim
        return bin
    elif marker == 'x':
        # zlib stream (zlib output always starts with 'x')
        return _decompress(bin)
    elif marker == 'u':
        # explicit uncompressed marker: strip it
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % marker)
121
121
# v0 index entry: four int32s (offset, compressed length, base rev,
# link rev) followed by three 20-byte hashes (parent 1, parent 2, nodeid)
indexformatv0 = ">4l20s20s20s"
v0shaoffset = 56  # byte offset of the nodeid within a packed entry
124
124
class revlogoldio(object):
    """parser/packer for the original (v0) revlog index format"""

    def __init__(self):
        # fixed byte size of one packed v0 index entry
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, data, inline):
        """parse raw v0 index data into (index, nodemap, chunkcache)"""
        entrysize = self.size
        index = []
        nodemap = {nullid: nullrev}
        n = 0
        off = 0
        datalen = len(data)
        while off + entrysize <= datalen:
            e = _unpack(indexformatv0, data[off:off + entrysize])
            off += entrysize
            # transform to revlogv1 format
            index.append((offset_type(e[0], 0), e[1], -1, e[2], e[3],
                          nodemap.get(e[4], nullrev),
                          nodemap.get(e[5], nullrev), e[6]))
            nodemap[e[6]] = n
            n += 1

        # add the magic null revision at -1
        index.append((0, 0, 0, -1, -1, -1, -1, nullid))

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        """pack a v1-style entry tuple back into the v0 wire format"""
        if gettype(entry[0]):
            # v0 has no room for per-revision flags
            raise RevlogError(_("index entry flags need RevlogNG"))
        packed = (getoffset(entry[0]), entry[1], entry[3], entry[4],
                  node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *packed)
157
157
# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
ngshaoffset = 32  # byte offset of the nodeid within a packed entry
versionformat = ">I"  # the revlog header is a single big-endian uint32
171
171
class revlogio(object):
    """parser/packer for the RevlogNG index format"""

    def __init__(self):
        # fixed byte size of one packed NG index entry
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, data, inline):
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, None, cache

    def packentry(self, entry, node, version, rev):
        packed = _pack(indexformatng, *entry)
        if rev == 0:
            # the first entry doubles as the revlog header: overlay the
            # version word on its first four bytes
            packed = _pack(versionformat, version) + packed[4:]
        return packed
186
186
187 class revlog(object):
187 class revlog(object):
188 """
188 """
189 the underlying revision storage object
189 the underlying revision storage object
190
190
191 A revlog consists of two parts, an index and the revision data.
191 A revlog consists of two parts, an index and the revision data.
192
192
193 The index is a file with a fixed record size containing
193 The index is a file with a fixed record size containing
194 information on each revision, including its nodeid (hash), the
194 information on each revision, including its nodeid (hash), the
195 nodeids of its parents, the position and offset of its data within
195 nodeids of its parents, the position and offset of its data within
196 the data file, and the revision it's based on. Finally, each entry
196 the data file, and the revision it's based on. Finally, each entry
197 contains a linkrev entry that can serve as a pointer to external
197 contains a linkrev entry that can serve as a pointer to external
198 data.
198 data.
199
199
200 The revision data itself is a linear collection of data chunks.
200 The revision data itself is a linear collection of data chunks.
201 Each chunk represents a revision and is usually represented as a
201 Each chunk represents a revision and is usually represented as a
202 delta against the previous chunk. To bound lookup time, runs of
202 delta against the previous chunk. To bound lookup time, runs of
203 deltas are limited to about 2 times the length of the original
203 deltas are limited to about 2 times the length of the original
204 version data. This makes retrieval of a version proportional to
204 version data. This makes retrieval of a version proportional to
205 its size, or O(1) relative to the number of revisions.
205 its size, or O(1) relative to the number of revisions.
206
206
207 Both pieces of the revlog are written to in an append-only
207 Both pieces of the revlog are written to in an append-only
208 fashion, which means we never need to rewrite a file to insert or
208 fashion, which means we never need to rewrite a file to insert or
209 remove data, and can use some simple techniques to avoid the need
209 remove data, and can use some simple techniques to avoid the need
210 for locking while reading.
210 for locking while reading.
211 """
211 """
    def __init__(self, opener, indexfile, shallowroot=None):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        # data file sits next to the index: foo.i -> foo.d
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener
        self._cache = None            # (node, rev, text) of last revision read
        self._chunkcache = (0, '')    # (offset, data) raw-chunk read cache
        self.index = []
        self._shallowroot = shallowroot
        self._parentdelta = 0
        self._pcache = {}             # partial-nodeid lookup cache
        self._nodecache = {nullid: nullrev}  # node -> rev, filled lazily
        self._nodepos = None          # resume point for the rev() scan

        # start from the configured default version...
        v = REVLOG_DEFAULT_VERSION
        if hasattr(opener, 'options') and 'defversion' in opener.options:
            v = opener.options['defversion']
            if v & REVLOGNG:
                v |= REVLOGNGINLINEDATA
            if v & REVLOGNG and 'parentdelta' in opener.options:
                self._parentdelta = 1

        if shallowroot:
            v |= REVLOGSHALLOW

        # ...but an existing index file's header overrides the default
        i = ''
        try:
            f = self.opener(self.indexfile)
            i = f.read()
            if len(i) > 0:
                v = struct.unpack(versionformat, i[:4])[0]
        except IOError, inst:
            # a missing index just means an empty revlog
            if inst.errno != errno.ENOENT:
                raise

        self.version = v
        self._inline = v & REVLOGNGINLINEDATA
        self._shallow = v & REVLOGSHALLOW
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        # reject flag/format combinations we don't understand
        if fmt == REVLOGV0 and flags:
            raise RevlogError(_("index %s unknown flags %#04x for format v0")
                              % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
            raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                              % (self.indexfile, flags >> 16))
        elif fmt > REVLOGNG:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))

        # pick the matching index parser for the detected format
        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        try:
            d = self._io.parseindex(i, self._inline)
        except (ValueError, IndexError):
            raise RevlogError(_("index %s is corrupted") % (self.indexfile))
        self.index, nodemap, self._chunkcache = d
        if nodemap is not None:
            # v0 parsing yields a complete nodemap up front
            self.nodemap = self._nodecache = nodemap
        if not self._chunkcache:
            self._chunkclear()
279
279
280 def tip(self):
280 def tip(self):
281 return self.node(len(self.index) - 2)
281 return self.node(len(self.index) - 2)
    def __len__(self):
        # exclude the trailing null sentinel entry from the count
        return len(self.index) - 1
    def __iter__(self):
        # yield revision numbers in ascending order
        for i in xrange(len(self)):
            yield i
287
287
    @util.propertycache
    def nodemap(self):
        # calling rev() has the side effect of populating _nodecache with
        # every node it scans past (see rev below), after which the cache
        # itself can serve as the node -> rev map
        n = self.rev(self.node(0))
        return self._nodecache
292
292
293 def rev(self, node):
293 def rev(self, node):
294 try:
294 try:
295 return self._nodecache[node]
295 return self._nodecache[node]
296 except KeyError:
296 except KeyError:
297 n = self._nodecache
297 n = self._nodecache
298 if node in n:
298 if node in n:
299 return n[node]
299 return n[node]
300 i = self.index
300 i = self.index
301 p = self._nodepos
301 p = self._nodepos
302 if p is None:
302 if p is None:
303 p = len(i) - 2
303 p = len(i) - 2
304 for r in xrange(p, -1, -1):
304 for r in xrange(p, -1, -1):
305 v = i[r][7]
305 v = i[r][7]
306 n[v] = r
306 n[v] = r
307 if v == node:
307 if v == node:
308 self._nodepos = r - 1
308 self._nodepos = r - 1
309 return r
309 return r
310 raise LookupError(node, self.indexfile, _('no node'))
310 raise LookupError(node, self.indexfile, _('no node'))
311
311
    def node(self, rev):
        # index entry field 7 is the binary nodeid
        return self.index[rev][7]
    def linkrev(self, rev):
        # index entry field 4 is the link revision
        return self.index[rev][4]
    def parents(self, node):
        # fields 5 and 6 hold the parent revision numbers; translate
        # them back to nodeids (field 7) without extra method calls
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
    def parentrevs(self, rev):
        # fields 5 and 6 are the parent revision numbers
        return self.index[rev][5:7]
    def start(self, rev):
        # the high bits of field 0 hold the data-file offset (cf. getoffset)
        return int(self.index[rev][0] >> 16)
    def end(self, rev):
        # one past the last byte of this revision's stored data
        return self.start(rev) + self.length(rev)
    def length(self, rev):
        # field 1 is the length of the stored (compressed) data
        return self.index[rev][1]
    def base(self, rev):
        # field 3 is the base revision of this revision's delta chain
        return self.index[rev][3]
    def flags(self, rev):
        # the low 16 bits of field 0 are per-revision flags (REVIDX_*)
        return self.index[rev][0] & 0xFFFF
    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        # field 2 caches the uncompressed length; -1 means unknown
        l = self.index[rev][2]
        if l >= 0:
            return l

        # fall back to reconstructing the full text and measuring it
        t = self.revision(self.node(rev))
        return len(t)
    size = rawsize
341
341
342 def reachable(self, node, stop=None):
342 def reachable(self, node, stop=None):
343 """return the set of all nodes ancestral to a given node, including
343 """return the set of all nodes ancestral to a given node, including
344 the node itself, stopping when stop is matched"""
344 the node itself, stopping when stop is matched"""
345 reachable = set((node,))
345 reachable = set((node,))
346 visit = [node]
346 visit = [node]
347 if stop:
347 if stop:
348 stopn = self.rev(stop)
348 stopn = self.rev(stop)
349 else:
349 else:
350 stopn = 0
350 stopn = 0
351 while visit:
351 while visit:
352 n = visit.pop(0)
352 n = visit.pop(0)
353 if n == stop:
353 if n == stop:
354 continue
354 continue
355 if n == nullid:
355 if n == nullid:
356 continue
356 continue
357 for p in self.parents(n):
357 for p in self.parents(n):
358 if self.rev(p) < stopn:
358 if self.rev(p) < stopn:
359 continue
359 continue
360 if p not in reachable:
360 if p not in reachable:
361 reachable.add(p)
361 reachable.add(p)
362 visit.append(p)
362 visit.append(p)
363 return reachable
363 return reachable
364
364
365 def ancestors(self, *revs):
365 def ancestors(self, *revs):
366 """Generate the ancestors of 'revs' in reverse topological order.
366 """Generate the ancestors of 'revs' in reverse topological order.
367
367
368 Yield a sequence of revision numbers starting with the parents
368 Yield a sequence of revision numbers starting with the parents
369 of each revision in revs, i.e., each revision is *not* considered
369 of each revision in revs, i.e., each revision is *not* considered
370 an ancestor of itself. Results are in breadth-first order:
370 an ancestor of itself. Results are in breadth-first order:
371 parents of each rev in revs, then parents of those, etc. Result
371 parents of each rev in revs, then parents of those, etc. Result
372 does not include the null revision."""
372 does not include the null revision."""
373 visit = list(revs)
373 visit = list(revs)
374 seen = set([nullrev])
374 seen = set([nullrev])
375 while visit:
375 while visit:
376 for parent in self.parentrevs(visit.pop(0)):
376 for parent in self.parentrevs(visit.pop(0)):
377 if parent not in seen:
377 if parent not in seen:
378 visit.append(parent)
378 visit.append(parent)
379 seen.add(parent)
379 seen.add(parent)
380 yield parent
380 yield parent
381
381
382 def descendants(self, *revs):
382 def descendants(self, *revs):
383 """Generate the descendants of 'revs' in revision order.
383 """Generate the descendants of 'revs' in revision order.
384
384
385 Yield a sequence of revision numbers starting with a child of
385 Yield a sequence of revision numbers starting with a child of
386 some rev in revs, i.e., each revision is *not* considered a
386 some rev in revs, i.e., each revision is *not* considered a
387 descendant of itself. Results are ordered by revision number (a
387 descendant of itself. Results are ordered by revision number (a
388 topological sort)."""
388 topological sort)."""
389 first = min(revs)
389 first = min(revs)
390 if first == nullrev:
390 if first == nullrev:
391 for i in self:
391 for i in self:
392 yield i
392 yield i
393 return
393 return
394
394
395 seen = set(revs)
395 seen = set(revs)
396 for i in xrange(first + 1, len(self)):
396 for i in xrange(first + 1, len(self)):
397 for x in self.parentrevs(i):
397 for x in self.parentrevs(i):
398 if x != nullrev and x in seen:
398 if x != nullrev and x in seen:
399 seen.add(i)
399 seen.add(i)
400 yield i
400 yield i
401 break
401 break
402
402
403 def findmissing(self, common=None, heads=None):
403 def findmissing(self, common=None, heads=None):
404 """Return the ancestors of heads that are not ancestors of common.
404 """Return the ancestors of heads that are not ancestors of common.
405
405
406 More specifically, return a list of nodes N such that every N
406 More specifically, return a list of nodes N such that every N
407 satisfies the following constraints:
407 satisfies the following constraints:
408
408
409 1. N is an ancestor of some node in 'heads'
409 1. N is an ancestor of some node in 'heads'
410 2. N is not an ancestor of any node in 'common'
410 2. N is not an ancestor of any node in 'common'
411
411
412 The list is sorted by revision number, meaning it is
412 The list is sorted by revision number, meaning it is
413 topologically sorted.
413 topologically sorted.
414
414
415 'heads' and 'common' are both lists of node IDs. If heads is
415 'heads' and 'common' are both lists of node IDs. If heads is
416 not supplied, uses all of the revlog's heads. If common is not
416 not supplied, uses all of the revlog's heads. If common is not
417 supplied, uses nullid."""
417 supplied, uses nullid."""
418 if common is None:
418 if common is None:
419 common = [nullid]
419 common = [nullid]
420 if heads is None:
420 if heads is None:
421 heads = self.heads()
421 heads = self.heads()
422
422
423 common = [self.rev(n) for n in common]
423 common = [self.rev(n) for n in common]
424 heads = [self.rev(n) for n in heads]
424 heads = [self.rev(n) for n in heads]
425
425
426 # we want the ancestors, but inclusive
426 # we want the ancestors, but inclusive
427 has = set(self.ancestors(*common))
427 has = set(self.ancestors(*common))
428 has.add(nullrev)
428 has.add(nullrev)
429 has.update(common)
429 has.update(common)
430
430
431 # take all ancestors from heads that aren't in has
431 # take all ancestors from heads that aren't in has
432 missing = set()
432 missing = set()
433 visit = [r for r in heads if r not in has]
433 visit = [r for r in heads if r not in has]
434 while visit:
434 while visit:
435 r = visit.pop(0)
435 r = visit.pop(0)
436 if r in missing:
436 if r in missing:
437 continue
437 continue
438 else:
438 else:
439 missing.add(r)
439 missing.add(r)
440 for p in self.parentrevs(r):
440 for p in self.parentrevs(r):
441 if p not in has:
441 if p not in has:
442 visit.append(p)
442 visit.append(p)
443 missing = list(missing)
443 missing = list(missing)
444 missing.sort()
444 missing.sort()
445 return [self.node(r) for r in missing]
445 return [self.node(r) for r in missing]
446
446
447 def nodesbetween(self, roots=None, heads=None):
447 def nodesbetween(self, roots=None, heads=None):
448 """Return a topological path from 'roots' to 'heads'.
448 """Return a topological path from 'roots' to 'heads'.
449
449
450 Return a tuple (nodes, outroots, outheads) where 'nodes' is a
450 Return a tuple (nodes, outroots, outheads) where 'nodes' is a
451 topologically sorted list of all nodes N that satisfy both of
451 topologically sorted list of all nodes N that satisfy both of
452 these constraints:
452 these constraints:
453
453
454 1. N is a descendant of some node in 'roots'
454 1. N is a descendant of some node in 'roots'
455 2. N is an ancestor of some node in 'heads'
455 2. N is an ancestor of some node in 'heads'
456
456
457 Every node is considered to be both a descendant and an ancestor
457 Every node is considered to be both a descendant and an ancestor
458 of itself, so every reachable node in 'roots' and 'heads' will be
458 of itself, so every reachable node in 'roots' and 'heads' will be
459 included in 'nodes'.
459 included in 'nodes'.
460
460
461 'outroots' is the list of reachable nodes in 'roots', i.e., the
461 'outroots' is the list of reachable nodes in 'roots', i.e., the
462 subset of 'roots' that is returned in 'nodes'. Likewise,
462 subset of 'roots' that is returned in 'nodes'. Likewise,
463 'outheads' is the subset of 'heads' that is also in 'nodes'.
463 'outheads' is the subset of 'heads' that is also in 'nodes'.
464
464
465 'roots' and 'heads' are both lists of node IDs. If 'roots' is
465 'roots' and 'heads' are both lists of node IDs. If 'roots' is
466 unspecified, uses nullid as the only root. If 'heads' is
466 unspecified, uses nullid as the only root. If 'heads' is
467 unspecified, uses list of all of the revlog's heads."""
467 unspecified, uses list of all of the revlog's heads."""
468 nonodes = ([], [], [])
468 nonodes = ([], [], [])
469 if roots is not None:
469 if roots is not None:
470 roots = list(roots)
470 roots = list(roots)
471 if not roots:
471 if not roots:
472 return nonodes
472 return nonodes
473 lowestrev = min([self.rev(n) for n in roots])
473 lowestrev = min([self.rev(n) for n in roots])
474 else:
474 else:
475 roots = [nullid] # Everybody's a descendent of nullid
475 roots = [nullid] # Everybody's a descendent of nullid
476 lowestrev = nullrev
476 lowestrev = nullrev
477 if (lowestrev == nullrev) and (heads is None):
477 if (lowestrev == nullrev) and (heads is None):
478 # We want _all_ the nodes!
478 # We want _all_ the nodes!
479 return ([self.node(r) for r in self], [nullid], list(self.heads()))
479 return ([self.node(r) for r in self], [nullid], list(self.heads()))
480 if heads is None:
480 if heads is None:
481 # All nodes are ancestors, so the latest ancestor is the last
481 # All nodes are ancestors, so the latest ancestor is the last
482 # node.
482 # node.
483 highestrev = len(self) - 1
483 highestrev = len(self) - 1
484 # Set ancestors to None to signal that every node is an ancestor.
484 # Set ancestors to None to signal that every node is an ancestor.
485 ancestors = None
485 ancestors = None
486 # Set heads to an empty dictionary for later discovery of heads
486 # Set heads to an empty dictionary for later discovery of heads
487 heads = {}
487 heads = {}
488 else:
488 else:
489 heads = list(heads)
489 heads = list(heads)
490 if not heads:
490 if not heads:
491 return nonodes
491 return nonodes
492 ancestors = set()
492 ancestors = set()
493 # Turn heads into a dictionary so we can remove 'fake' heads.
493 # Turn heads into a dictionary so we can remove 'fake' heads.
494 # Also, later we will be using it to filter out the heads we can't
494 # Also, later we will be using it to filter out the heads we can't
495 # find from roots.
495 # find from roots.
496 heads = dict.fromkeys(heads, 0)
496 heads = dict.fromkeys(heads, 0)
497 # Start at the top and keep marking parents until we're done.
497 # Start at the top and keep marking parents until we're done.
498 nodestotag = set(heads)
498 nodestotag = set(heads)
499 # Remember where the top was so we can use it as a limit later.
499 # Remember where the top was so we can use it as a limit later.
500 highestrev = max([self.rev(n) for n in nodestotag])
500 highestrev = max([self.rev(n) for n in nodestotag])
501 while nodestotag:
501 while nodestotag:
502 # grab a node to tag
502 # grab a node to tag
503 n = nodestotag.pop()
503 n = nodestotag.pop()
504 # Never tag nullid
504 # Never tag nullid
505 if n == nullid:
505 if n == nullid:
506 continue
506 continue
507 # A node's revision number represents its place in a
507 # A node's revision number represents its place in a
508 # topologically sorted list of nodes.
508 # topologically sorted list of nodes.
509 r = self.rev(n)
509 r = self.rev(n)
510 if r >= lowestrev:
510 if r >= lowestrev:
511 if n not in ancestors:
511 if n not in ancestors:
512 # If we are possibly a descendent of one of the roots
512 # If we are possibly a descendent of one of the roots
513 # and we haven't already been marked as an ancestor
513 # and we haven't already been marked as an ancestor
514 ancestors.add(n) # Mark as ancestor
514 ancestors.add(n) # Mark as ancestor
515 # Add non-nullid parents to list of nodes to tag.
515 # Add non-nullid parents to list of nodes to tag.
516 nodestotag.update([p for p in self.parents(n) if
516 nodestotag.update([p for p in self.parents(n) if
517 p != nullid])
517 p != nullid])
518 elif n in heads: # We've seen it before, is it a fake head?
518 elif n in heads: # We've seen it before, is it a fake head?
519 # So it is, real heads should not be the ancestors of
519 # So it is, real heads should not be the ancestors of
520 # any other heads.
520 # any other heads.
521 heads.pop(n)
521 heads.pop(n)
522 if not ancestors:
522 if not ancestors:
523 return nonodes
523 return nonodes
524 # Now that we have our set of ancestors, we want to remove any
524 # Now that we have our set of ancestors, we want to remove any
525 # roots that are not ancestors.
525 # roots that are not ancestors.
526
526
527 # If one of the roots was nullid, everything is included anyway.
527 # If one of the roots was nullid, everything is included anyway.
528 if lowestrev > nullrev:
528 if lowestrev > nullrev:
529 # But, since we weren't, let's recompute the lowest rev to not
529 # But, since we weren't, let's recompute the lowest rev to not
530 # include roots that aren't ancestors.
530 # include roots that aren't ancestors.
531
531
532 # Filter out roots that aren't ancestors of heads
532 # Filter out roots that aren't ancestors of heads
533 roots = [n for n in roots if n in ancestors]
533 roots = [n for n in roots if n in ancestors]
534 # Recompute the lowest revision
534 # Recompute the lowest revision
535 if roots:
535 if roots:
536 lowestrev = min([self.rev(n) for n in roots])
536 lowestrev = min([self.rev(n) for n in roots])
537 else:
537 else:
538 # No more roots? Return empty list
538 # No more roots? Return empty list
539 return nonodes
539 return nonodes
540 else:
540 else:
541 # We are descending from nullid, and don't need to care about
541 # We are descending from nullid, and don't need to care about
542 # any other roots.
542 # any other roots.
543 lowestrev = nullrev
543 lowestrev = nullrev
544 roots = [nullid]
544 roots = [nullid]
545 # Transform our roots list into a set.
545 # Transform our roots list into a set.
546 descendents = set(roots)
546 descendents = set(roots)
547 # Also, keep the original roots so we can filter out roots that aren't
547 # Also, keep the original roots so we can filter out roots that aren't
548 # 'real' roots (i.e. are descended from other roots).
548 # 'real' roots (i.e. are descended from other roots).
549 roots = descendents.copy()
549 roots = descendents.copy()
550 # Our topologically sorted list of output nodes.
550 # Our topologically sorted list of output nodes.
551 orderedout = []
551 orderedout = []
552 # Don't start at nullid since we don't want nullid in our output list,
552 # Don't start at nullid since we don't want nullid in our output list,
553 # and if nullid shows up in descedents, empty parents will look like
553 # and if nullid shows up in descedents, empty parents will look like
554 # they're descendents.
554 # they're descendents.
555 for r in xrange(max(lowestrev, 0), highestrev + 1):
555 for r in xrange(max(lowestrev, 0), highestrev + 1):
556 n = self.node(r)
556 n = self.node(r)
557 isdescendent = False
557 isdescendent = False
558 if lowestrev == nullrev: # Everybody is a descendent of nullid
558 if lowestrev == nullrev: # Everybody is a descendent of nullid
559 isdescendent = True
559 isdescendent = True
560 elif n in descendents:
560 elif n in descendents:
561 # n is already a descendent
561 # n is already a descendent
562 isdescendent = True
562 isdescendent = True
563 # This check only needs to be done here because all the roots
563 # This check only needs to be done here because all the roots
564 # will start being marked is descendents before the loop.
564 # will start being marked is descendents before the loop.
565 if n in roots:
565 if n in roots:
566 # If n was a root, check if it's a 'real' root.
566 # If n was a root, check if it's a 'real' root.
567 p = tuple(self.parents(n))
567 p = tuple(self.parents(n))
568 # If any of its parents are descendents, it's not a root.
568 # If any of its parents are descendents, it's not a root.
569 if (p[0] in descendents) or (p[1] in descendents):
569 if (p[0] in descendents) or (p[1] in descendents):
570 roots.remove(n)
570 roots.remove(n)
571 else:
571 else:
572 p = tuple(self.parents(n))
572 p = tuple(self.parents(n))
573 # A node is a descendent if either of its parents are
573 # A node is a descendent if either of its parents are
574 # descendents. (We seeded the dependents list with the roots
574 # descendents. (We seeded the dependents list with the roots
575 # up there, remember?)
575 # up there, remember?)
576 if (p[0] in descendents) or (p[1] in descendents):
576 if (p[0] in descendents) or (p[1] in descendents):
577 descendents.add(n)
577 descendents.add(n)
578 isdescendent = True
578 isdescendent = True
579 if isdescendent and ((ancestors is None) or (n in ancestors)):
579 if isdescendent and ((ancestors is None) or (n in ancestors)):
580 # Only include nodes that are both descendents and ancestors.
580 # Only include nodes that are both descendents and ancestors.
581 orderedout.append(n)
581 orderedout.append(n)
582 if (ancestors is not None) and (n in heads):
582 if (ancestors is not None) and (n in heads):
583 # We're trying to figure out which heads are reachable
583 # We're trying to figure out which heads are reachable
584 # from roots.
584 # from roots.
585 # Mark this head as having been reached
585 # Mark this head as having been reached
586 heads[n] = 1
586 heads[n] = 1
587 elif ancestors is None:
587 elif ancestors is None:
588 # Otherwise, we're trying to discover the heads.
588 # Otherwise, we're trying to discover the heads.
589 # Assume this is a head because if it isn't, the next step
589 # Assume this is a head because if it isn't, the next step
590 # will eventually remove it.
590 # will eventually remove it.
591 heads[n] = 1
591 heads[n] = 1
592 # But, obviously its parents aren't.
592 # But, obviously its parents aren't.
593 for p in self.parents(n):
593 for p in self.parents(n):
594 heads.pop(p, None)
594 heads.pop(p, None)
595 heads = [n for n in heads.iterkeys() if heads[n] != 0]
595 heads = [n for n in heads.iterkeys() if heads[n] != 0]
596 roots = list(roots)
596 roots = list(roots)
597 assert orderedout
597 assert orderedout
598 assert roots
598 assert roots
599 assert heads
599 assert heads
600 return (orderedout, roots, heads)
600 return (orderedout, roots, heads)
601
601
602 def heads(self, start=None, stop=None):
602 def heads(self, start=None, stop=None):
603 """return the list of all nodes that have no children
603 """return the list of all nodes that have no children
604
604
605 if start is specified, only heads that are descendants of
605 if start is specified, only heads that are descendants of
606 start will be returned
606 start will be returned
607 if stop is specified, it will consider all the revs from stop
607 if stop is specified, it will consider all the revs from stop
608 as if they had no children
608 as if they had no children
609 """
609 """
610 if start is None and stop is None:
610 if start is None and stop is None:
611 count = len(self)
611 count = len(self)
612 if not count:
612 if not count:
613 return [nullid]
613 return [nullid]
614 ishead = [1] * (count + 1)
614 ishead = [1] * (count + 1)
615 index = self.index
615 index = self.index
616 for r in xrange(count):
616 for r in xrange(count):
617 e = index[r]
617 e = index[r]
618 ishead[e[5]] = ishead[e[6]] = 0
618 ishead[e[5]] = ishead[e[6]] = 0
619 return [self.node(r) for r in xrange(count) if ishead[r]]
619 return [self.node(r) for r in xrange(count) if ishead[r]]
620
620
621 if start is None:
621 if start is None:
622 start = nullid
622 start = nullid
623 if stop is None:
623 if stop is None:
624 stop = []
624 stop = []
625 stoprevs = set([self.rev(n) for n in stop])
625 stoprevs = set([self.rev(n) for n in stop])
626 startrev = self.rev(start)
626 startrev = self.rev(start)
627 reachable = set((startrev,))
627 reachable = set((startrev,))
628 heads = set((startrev,))
628 heads = set((startrev,))
629
629
630 parentrevs = self.parentrevs
630 parentrevs = self.parentrevs
631 for r in xrange(startrev + 1, len(self)):
631 for r in xrange(startrev + 1, len(self)):
632 for p in parentrevs(r):
632 for p in parentrevs(r):
633 if p in reachable:
633 if p in reachable:
634 if r not in stoprevs:
634 if r not in stoprevs:
635 reachable.add(r)
635 reachable.add(r)
636 heads.add(r)
636 heads.add(r)
637 if p in heads and p not in stoprevs:
637 if p in heads and p not in stoprevs:
638 heads.remove(p)
638 heads.remove(p)
639
639
640 return [self.node(r) for r in heads]
640 return [self.node(r) for r in heads]
641
641
642 def children(self, node):
642 def children(self, node):
643 """find the children of a given node"""
643 """find the children of a given node"""
644 c = []
644 c = []
645 p = self.rev(node)
645 p = self.rev(node)
646 for r in range(p + 1, len(self)):
646 for r in range(p + 1, len(self)):
647 prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
647 prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
648 if prevs:
648 if prevs:
649 for pr in prevs:
649 for pr in prevs:
650 if pr == p:
650 if pr == p:
651 c.append(self.node(r))
651 c.append(self.node(r))
652 elif p == nullrev:
652 elif p == nullrev:
653 c.append(self.node(r))
653 c.append(self.node(r))
654 return c
654 return c
655
655
656 def descendant(self, start, end):
656 def descendant(self, start, end):
657 if start == nullrev:
657 if start == nullrev:
658 return True
658 return True
659 for i in self.descendants(start):
659 for i in self.descendants(start):
660 if i == end:
660 if i == end:
661 return True
661 return True
662 elif i > end:
662 elif i > end:
663 break
663 break
664 return False
664 return False
665
665
666 def ancestor(self, a, b):
666 def ancestor(self, a, b):
667 """calculate the least common ancestor of nodes a and b"""
667 """calculate the least common ancestor of nodes a and b"""
668
668
669 # fast path, check if it is a descendant
669 # fast path, check if it is a descendant
670 a, b = self.rev(a), self.rev(b)
670 a, b = self.rev(a), self.rev(b)
671 start, end = sorted((a, b))
671 start, end = sorted((a, b))
672 if self.descendant(start, end):
672 if self.descendant(start, end):
673 return self.node(start)
673 return self.node(start)
674
674
675 def parents(rev):
675 def parents(rev):
676 return [p for p in self.parentrevs(rev) if p != nullrev]
676 return [p for p in self.parentrevs(rev) if p != nullrev]
677
677
678 c = ancestor.ancestor(a, b, parents)
678 c = ancestor.ancestor(a, b, parents)
679 if c is None:
679 if c is None:
680 return nullid
680 return nullid
681
681
682 return self.node(c)
682 return self.node(c)
683
683
684 def _match(self, id):
684 def _match(self, id):
685 if isinstance(id, (long, int)):
685 if isinstance(id, (long, int)):
686 # rev
686 # rev
687 return self.node(id)
687 return self.node(id)
688 if len(id) == 20:
688 if len(id) == 20:
689 # possibly a binary node
689 # possibly a binary node
690 # odds of a binary node being all hex in ASCII are 1 in 10**25
690 # odds of a binary node being all hex in ASCII are 1 in 10**25
691 try:
691 try:
692 node = id
692 node = id
693 self.rev(node) # quick search the index
693 self.rev(node) # quick search the index
694 return node
694 return node
695 except LookupError:
695 except LookupError:
696 pass # may be partial hex id
696 pass # may be partial hex id
697 try:
697 try:
698 # str(rev)
698 # str(rev)
699 rev = int(id)
699 rev = int(id)
700 if str(rev) != id:
700 if str(rev) != id:
701 raise ValueError
701 raise ValueError
702 if rev < 0:
702 if rev < 0:
703 rev = len(self) + rev
703 rev = len(self) + rev
704 if rev < 0 or rev >= len(self):
704 if rev < 0 or rev >= len(self):
705 raise ValueError
705 raise ValueError
706 return self.node(rev)
706 return self.node(rev)
707 except (ValueError, OverflowError):
707 except (ValueError, OverflowError):
708 pass
708 pass
709 if len(id) == 40:
709 if len(id) == 40:
710 try:
710 try:
711 # a full hex nodeid?
711 # a full hex nodeid?
712 node = bin(id)
712 node = bin(id)
713 self.rev(node)
713 self.rev(node)
714 return node
714 return node
715 except (TypeError, LookupError):
715 except (TypeError, LookupError):
716 pass
716 pass
717
717
718 def _partialmatch(self, id):
718 def _partialmatch(self, id):
719 if id in self._pcache:
719 if id in self._pcache:
720 return self._pcache[id]
720 return self._pcache[id]
721
721
722 if len(id) < 40:
722 if len(id) < 40:
723 try:
723 try:
724 # hex(node)[:...]
724 # hex(node)[:...]
725 l = len(id) // 2 # grab an even number of digits
725 l = len(id) // 2 # grab an even number of digits
726 prefix = bin(id[:l * 2])
726 prefix = bin(id[:l * 2])
727 nl = [e[7] for e in self.index if e[7].startswith(prefix)]
727 nl = [e[7] for e in self.index if e[7].startswith(prefix)]
728 nl = [n for n in nl if hex(n).startswith(id)]
728 nl = [n for n in nl if hex(n).startswith(id)]
729 if len(nl) > 0:
729 if len(nl) > 0:
730 if len(nl) == 1:
730 if len(nl) == 1:
731 self._pcache[id] = nl[0]
731 self._pcache[id] = nl[0]
732 return nl[0]
732 return nl[0]
733 raise LookupError(id, self.indexfile,
733 raise LookupError(id, self.indexfile,
734 _('ambiguous identifier'))
734 _('ambiguous identifier'))
735 return None
735 return None
736 except TypeError:
736 except TypeError:
737 pass
737 pass
738
738
739 def lookup(self, id):
739 def lookup(self, id):
740 """locate a node based on:
740 """locate a node based on:
741 - revision number or str(revision number)
741 - revision number or str(revision number)
742 - nodeid or subset of hex nodeid
742 - nodeid or subset of hex nodeid
743 """
743 """
744 n = self._match(id)
744 n = self._match(id)
745 if n is not None:
745 if n is not None:
746 return n
746 return n
747 n = self._partialmatch(id)
747 n = self._partialmatch(id)
748 if n:
748 if n:
749 return n
749 return n
750
750
751 raise LookupError(id, self.indexfile, _('no match found'))
751 raise LookupError(id, self.indexfile, _('no match found'))
752
752
753 def cmp(self, node, text):
753 def cmp(self, node, text):
754 """compare text with a given file revision
754 """compare text with a given file revision
755
755
756 returns True if text is different than what is stored.
756 returns True if text is different than what is stored.
757 """
757 """
758 p1, p2 = self.parents(node)
758 p1, p2 = self.parents(node)
759 return hash(text, p1, p2) != node
759 return hash(text, p1, p2) != node
760
760
761 def _addchunk(self, offset, data):
761 def _addchunk(self, offset, data):
762 o, d = self._chunkcache
762 o, d = self._chunkcache
763 # try to add to existing cache
763 # try to add to existing cache
764 if o + len(d) == offset and len(d) + len(data) < _chunksize:
764 if o + len(d) == offset and len(d) + len(data) < _chunksize:
765 self._chunkcache = o, d + data
765 self._chunkcache = o, d + data
766 else:
766 else:
767 self._chunkcache = offset, data
767 self._chunkcache = offset, data
768
768
769 def _loadchunk(self, offset, length):
769 def _loadchunk(self, offset, length):
770 if self._inline:
770 if self._inline:
771 df = self.opener(self.indexfile)
771 df = self.opener(self.indexfile)
772 else:
772 else:
773 df = self.opener(self.datafile)
773 df = self.opener(self.datafile)
774
774
775 readahead = max(65536, length)
775 readahead = max(65536, length)
776 df.seek(offset)
776 df.seek(offset)
777 d = df.read(readahead)
777 d = df.read(readahead)
778 self._addchunk(offset, d)
778 self._addchunk(offset, d)
779 if readahead > length:
779 if readahead > length:
780 return d[:length]
780 return d[:length]
781 return d
781 return d
782
782
783 def _getchunk(self, offset, length):
783 def _getchunk(self, offset, length):
784 o, d = self._chunkcache
784 o, d = self._chunkcache
785 l = len(d)
785 l = len(d)
786
786
787 # is it in the cache?
787 # is it in the cache?
788 cachestart = offset - o
788 cachestart = offset - o
789 cacheend = cachestart + length
789 cacheend = cachestart + length
790 if cachestart >= 0 and cacheend <= l:
790 if cachestart >= 0 and cacheend <= l:
791 if cachestart == 0 and cacheend == l:
791 if cachestart == 0 and cacheend == l:
792 return d # avoid a copy
792 return d # avoid a copy
793 return d[cachestart:cacheend]
793 return d[cachestart:cacheend]
794
794
795 return self._loadchunk(offset, length)
795 return self._loadchunk(offset, length)
796
796
797 def _chunkraw(self, startrev, endrev):
797 def _chunkraw(self, startrev, endrev):
798 start = self.start(startrev)
798 start = self.start(startrev)
799 length = self.end(endrev) - start
799 length = self.end(endrev) - start
800 if self._inline:
800 if self._inline:
801 start += (startrev + 1) * self._io.size
801 start += (startrev + 1) * self._io.size
802 return self._getchunk(start, length)
802 return self._getchunk(start, length)
803
803
804 def _chunk(self, rev):
804 def _chunk(self, rev):
805 return decompress(self._chunkraw(rev, rev))
805 return decompress(self._chunkraw(rev, rev))
806
806
807 def _chunkclear(self):
807 def _chunkclear(self):
808 self._chunkcache = (0, '')
808 self._chunkcache = (0, '')
809
809
810 def deltaparent(self, rev):
810 def deltaparent(self, rev):
811 """return previous revision or parentrev according to flags"""
811 """return previous revision or parentrev according to flags"""
812 if self.flags(rev) & REVIDX_PARENTDELTA:
812 if self.flags(rev) & REVIDX_PARENTDELTA:
813 return self.parentrevs(rev)[0]
813 return self.parentrevs(rev)[0]
814 else:
814 else:
815 return rev - 1
815 return rev - 1
816
816
817 def revdiff(self, rev1, rev2):
817 def revdiff(self, rev1, rev2):
818 """return or calculate a delta between two revisions"""
818 """return or calculate a delta between two revisions"""
819 if self.base(rev2) != rev2 and self.deltaparent(rev2) == rev1:
819 if self.base(rev2) != rev2 and self.deltaparent(rev2) == rev1:
820 return self._chunk(rev2)
820 return self._chunk(rev2)
821
821
822 return mdiff.textdiff(self.revision(self.node(rev1)),
822 return mdiff.textdiff(self.revision(self.node(rev1)),
823 self.revision(self.node(rev2)))
823 self.revision(self.node(rev2)))
824
824
825 def revision(self, node):
825 def revision(self, node):
826 """return an uncompressed revision of a given node"""
826 """return an uncompressed revision of a given node"""
827 cachedrev = None
827 cachedrev = None
828 if node == nullid:
828 if node == nullid:
829 return ""
829 return ""
830 if self._cache:
830 if self._cache:
831 if self._cache[0] == node:
831 if self._cache[0] == node:
832 return self._cache[2]
832 return self._cache[2]
833 cachedrev = self._cache[1]
833 cachedrev = self._cache[1]
834
834
835 # look up what we need to read
835 # look up what we need to read
836 text = None
836 text = None
837 rev = self.rev(node)
837 rev = self.rev(node)
838 base = self.base(rev)
838 base = self.base(rev)
839
839
840 # check rev flags
840 # check rev flags
841 if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
841 if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
842 raise RevlogError(_('incompatible revision flag %x') %
842 raise RevlogError(_('incompatible revision flag %x') %
843 (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))
843 (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))
844
844
845 # build delta chain
845 # build delta chain
846 chain = []
846 chain = []
847 index = self.index # for performance
847 index = self.index # for performance
848 iterrev = rev
848 iterrev = rev
849 e = index[iterrev]
849 e = index[iterrev]
850 while iterrev != base and iterrev != cachedrev:
850 while iterrev != base and iterrev != cachedrev:
851 chain.append(iterrev)
851 chain.append(iterrev)
852 if e[0] & REVIDX_PARENTDELTA:
852 if e[0] & REVIDX_PARENTDELTA:
853 iterrev = e[5]
853 iterrev = e[5]
854 else:
854 else:
855 iterrev -= 1
855 iterrev -= 1
856 e = index[iterrev]
856 e = index[iterrev]
857 chain.reverse()
857 chain.reverse()
858 base = iterrev
858 base = iterrev
859
859
860 if iterrev == cachedrev:
860 if iterrev == cachedrev:
861 # cache hit
861 # cache hit
862 text = self._cache[2]
862 text = self._cache[2]
863
863
864 # drop cache to save memory
864 # drop cache to save memory
865 self._cache = None
865 self._cache = None
866
866
867 self._chunkraw(base, rev)
867 self._chunkraw(base, rev)
868 if text is None:
868 if text is None:
869 text = self._chunk(base)
869 text = self._chunk(base)
870
870
871 bins = [self._chunk(r) for r in chain]
871 bins = [self._chunk(r) for r in chain]
872 text = mdiff.patches(text, bins)
872 text = mdiff.patches(text, bins)
873
873
874 text = self._checkhash(text, node)
874 text = self._checkhash(text, node, rev)
875
875
876 self._cache = (node, rev, text)
876 self._cache = (node, rev, text)
877 return text
877 return text
878
878
879 def _checkhash(self, text, node):
879 def _checkhash(self, text, node, rev):
880 p1, p2 = self.parents(node)
880 p1, p2 = self.parents(node)
881 if (node != hash(text, p1, p2) and
881 if (node != hash(text, p1, p2) and
882 not (self.flags(rev) & REVIDX_PUNCHED_FLAG)):
882 not (self.flags(rev) & REVIDX_PUNCHED_FLAG)):
883 raise RevlogError(_("integrity check failed on %s:%d")
883 raise RevlogError(_("integrity check failed on %s:%d")
884 % (self.indexfile, rev))
884 % (self.indexfile, rev))
885 return text
885 return text
886
886
887 def checkinlinesize(self, tr, fp=None):
887 def checkinlinesize(self, tr, fp=None):
888 if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
888 if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
889 return
889 return
890
890
891 trinfo = tr.find(self.indexfile)
891 trinfo = tr.find(self.indexfile)
892 if trinfo is None:
892 if trinfo is None:
893 raise RevlogError(_("%s not found in the transaction")
893 raise RevlogError(_("%s not found in the transaction")
894 % self.indexfile)
894 % self.indexfile)
895
895
896 trindex = trinfo[2]
896 trindex = trinfo[2]
897 dataoff = self.start(trindex)
897 dataoff = self.start(trindex)
898
898
899 tr.add(self.datafile, dataoff)
899 tr.add(self.datafile, dataoff)
900
900
901 if fp:
901 if fp:
902 fp.flush()
902 fp.flush()
903 fp.close()
903 fp.close()
904
904
905 df = self.opener(self.datafile, 'w')
905 df = self.opener(self.datafile, 'w')
906 try:
906 try:
907 for r in self:
907 for r in self:
908 df.write(self._chunkraw(r, r))
908 df.write(self._chunkraw(r, r))
909 finally:
909 finally:
910 df.close()
910 df.close()
911
911
912 fp = self.opener(self.indexfile, 'w', atomictemp=True)
912 fp = self.opener(self.indexfile, 'w', atomictemp=True)
913 self.version &= ~(REVLOGNGINLINEDATA)
913 self.version &= ~(REVLOGNGINLINEDATA)
914 self._inline = False
914 self._inline = False
915 for i in self:
915 for i in self:
916 e = self._io.packentry(self.index[i], self.node, self.version, i)
916 e = self._io.packentry(self.index[i], self.node, self.version, i)
917 fp.write(e)
917 fp.write(e)
918
918
919 # if we don't call rename, the temp file will never replace the
919 # if we don't call rename, the temp file will never replace the
920 # real index
920 # real index
921 fp.rename()
921 fp.rename()
922
922
923 tr.replace(self.indexfile, trindex * self._io.size)
923 tr.replace(self.indexfile, trindex * self._io.size)
924 self._chunkclear()
924 self._chunkclear()
925
925
926 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):
926 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):
927 """add a revision to the log
927 """add a revision to the log
928
928
929 text - the revision data to add
929 text - the revision data to add
930 transaction - the transaction object used for rollback
930 transaction - the transaction object used for rollback
931 link - the linkrev data to add
931 link - the linkrev data to add
932 p1, p2 - the parent nodeids of the revision
932 p1, p2 - the parent nodeids of the revision
933 cachedelta - an optional precomputed delta
933 cachedelta - an optional precomputed delta
934 """
934 """
935 node = hash(text, p1, p2)
935 node = hash(text, p1, p2)
936 if (node in self.nodemap and
936 if (node in self.nodemap and
937 (not self.flags(self.rev(node)) & REVIDX_PUNCHED_FLAG)):
937 (not self.flags(self.rev(node)) & REVIDX_PUNCHED_FLAG)):
938 return node
938 return node
939
939
940 dfh = None
940 dfh = None
941 if not self._inline:
941 if not self._inline:
942 dfh = self.opener(self.datafile, "a")
942 dfh = self.opener(self.datafile, "a")
943 ifh = self.opener(self.indexfile, "a+")
943 ifh = self.opener(self.indexfile, "a+")
944 try:
944 try:
945 return self._addrevision(node, text, transaction, link, p1, p2,
945 return self._addrevision(node, text, transaction, link, p1, p2,
946 cachedelta, ifh, dfh)
946 cachedelta, ifh, dfh)
947 finally:
947 finally:
948 if dfh:
948 if dfh:
949 dfh.close()
949 dfh.close()
950 ifh.close()
950 ifh.close()
951
951
952 def _addrevision(self, node, text, transaction, link, p1, p2,
952 def _addrevision(self, node, text, transaction, link, p1, p2,
953 cachedelta, ifh, dfh):
953 cachedelta, ifh, dfh):
954
954
955 btext = [text]
955 btext = [text]
956 def buildtext():
956 def buildtext():
957 if btext[0] is not None:
957 if btext[0] is not None:
958 return btext[0]
958 return btext[0]
959 # flush any pending writes here so we can read it in revision
959 # flush any pending writes here so we can read it in revision
960 if dfh:
960 if dfh:
961 dfh.flush()
961 dfh.flush()
962 ifh.flush()
962 ifh.flush()
963 basetext = self.revision(self.node(cachedelta[0]))
963 basetext = self.revision(self.node(cachedelta[0]))
964 btext[0] = mdiff.patch(basetext, cachedelta[1])
964 btext[0] = mdiff.patch(basetext, cachedelta[1])
965 chk = hash(btext[0], p1, p2)
965 chk = hash(btext[0], p1, p2)
966 if chk != node:
966 if chk != node:
967 raise RevlogError(_("consistency error in delta"))
967 raise RevlogError(_("consistency error in delta"))
968 return btext[0]
968 return btext[0]
969
969
970 def builddelta(rev):
970 def builddelta(rev):
971 # can we use the cached delta?
971 # can we use the cached delta?
972 if cachedelta and cachedelta[0] == rev:
972 if cachedelta and cachedelta[0] == rev:
973 delta = cachedelta[1]
973 delta = cachedelta[1]
974 else:
974 else:
975 t = buildtext()
975 t = buildtext()
976 ptext = self.revision(self.node(rev))
976 ptext = self.revision(self.node(rev))
977 delta = mdiff.textdiff(ptext, t)
977 delta = mdiff.textdiff(ptext, t)
978 data = compress(delta)
978 data = compress(delta)
979 l = len(data[1]) + len(data[0])
979 l = len(data[1]) + len(data[0])
980 base = self.base(rev)
980 base = self.base(rev)
981 dist = l + offset - self.start(base)
981 dist = l + offset - self.start(base)
982 return dist, l, data, base
982 return dist, l, data, base
983
983
984 curr = len(self)
984 curr = len(self)
985 prev = curr - 1
985 prev = curr - 1
986 base = curr
986 base = curr
987 offset = self.end(prev)
987 offset = self.end(prev)
988 flags = 0
988 flags = 0
989 d = None
989 d = None
990 p1r, p2r = self.rev(p1), self.rev(p2)
990 p1r, p2r = self.rev(p1), self.rev(p2)
991
991
992 # should we try to build a delta?
992 # should we try to build a delta?
993 if prev != nullrev:
993 if prev != nullrev:
994 d = builddelta(prev)
994 d = builddelta(prev)
995 if self._parentdelta and prev != p1r:
995 if self._parentdelta and prev != p1r:
996 d2 = builddelta(p1r)
996 d2 = builddelta(p1r)
997 if d2 < d:
997 if d2 < d:
998 d = d2
998 d = d2
999 flags = REVIDX_PARENTDELTA
999 flags = REVIDX_PARENTDELTA
1000 dist, l, data, base = d
1000 dist, l, data, base = d
1001
1001
1002 # full versions are inserted when the needed deltas
1002 # full versions are inserted when the needed deltas
1003 # become comparable to the uncompressed text
1003 # become comparable to the uncompressed text
1004 # or the base revision is punched
1004 # or the base revision is punched
1005 if text is None:
1005 if text is None:
1006 textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
1006 textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
1007 cachedelta[1])
1007 cachedelta[1])
1008 else:
1008 else:
1009 textlen = len(text)
1009 textlen = len(text)
1010 if (d is None or dist > textlen * 2 or
1010 if (d is None or dist > textlen * 2 or
1011 (self.flags(base) & REVIDX_PUNCHED_FLAG)):
1011 (self.flags(base) & REVIDX_PUNCHED_FLAG)):
1012 text = buildtext()
1012 text = buildtext()
1013 data = compress(text)
1013 data = compress(text)
1014 l = len(data[1]) + len(data[0])
1014 l = len(data[1]) + len(data[0])
1015 base = curr
1015 base = curr
1016
1016
1017 e = (offset_type(offset, flags), l, textlen,
1017 e = (offset_type(offset, flags), l, textlen,
1018 base, link, p1r, p2r, node)
1018 base, link, p1r, p2r, node)
1019 self.index.insert(-1, e)
1019 self.index.insert(-1, e)
1020 self.nodemap[node] = curr
1020 self.nodemap[node] = curr
1021
1021
1022 entry = self._io.packentry(e, self.node, self.version, curr)
1022 entry = self._io.packentry(e, self.node, self.version, curr)
1023 if not self._inline:
1023 if not self._inline:
1024 transaction.add(self.datafile, offset)
1024 transaction.add(self.datafile, offset)
1025 transaction.add(self.indexfile, curr * len(entry))
1025 transaction.add(self.indexfile, curr * len(entry))
1026 if data[0]:
1026 if data[0]:
1027 dfh.write(data[0])
1027 dfh.write(data[0])
1028 dfh.write(data[1])
1028 dfh.write(data[1])
1029 dfh.flush()
1029 dfh.flush()
1030 ifh.write(entry)
1030 ifh.write(entry)
1031 else:
1031 else:
1032 offset += curr * self._io.size
1032 offset += curr * self._io.size
1033 transaction.add(self.indexfile, offset, curr)
1033 transaction.add(self.indexfile, offset, curr)
1034 ifh.write(entry)
1034 ifh.write(entry)
1035 ifh.write(data[0])
1035 ifh.write(data[0])
1036 ifh.write(data[1])
1036 ifh.write(data[1])
1037 self.checkinlinesize(transaction, ifh)
1037 self.checkinlinesize(transaction, ifh)
1038
1038
1039 if type(text) == str: # only accept immutable objects
1039 if type(text) == str: # only accept immutable objects
1040 self._cache = (node, curr, text)
1040 self._cache = (node, curr, text)
1041 return node
1041 return node
1042
1042
1043 def group(self, nodelist, lookup, infocollect=None, fullrev=False):
1043 def group(self, nodelist, lookup, infocollect=None, fullrev=False):
1044 """Calculate a delta group, yielding a sequence of changegroup chunks
1044 """Calculate a delta group, yielding a sequence of changegroup chunks
1045 (strings).
1045 (strings).
1046
1046
1047 Given a list of changeset revs, return a set of deltas and
1047 Given a list of changeset revs, return a set of deltas and
1048 metadata corresponding to nodes. The first delta is
1048 metadata corresponding to nodes. The first delta is
1049 first parent(nodelist[0]) -> nodelist[0], the receiver is
1049 first parent(nodelist[0]) -> nodelist[0], the receiver is
1050 guaranteed to have this parent as it has all history before
1050 guaranteed to have this parent as it has all history before
1051 these changesets. In the case firstparent is nullrev the
1051 these changesets. In the case firstparent is nullrev the
1052 changegroup starts with a full revision.
1052 changegroup starts with a full revision.
1053 fullrev forces the insertion of the full revision, necessary
1053 fullrev forces the insertion of the full revision, necessary
1054 in the case of shallow clones where the first parent might
1054 in the case of shallow clones where the first parent might
1055 not exist at the reciever.
1055 not exist at the reciever.
1056 """
1056 """
1057
1057
1058 revs = [self.rev(n) for n in nodelist]
1058 revs = [self.rev(n) for n in nodelist]
1059
1059
1060 # if we don't have any revisions touched by these changesets, bail
1060 # if we don't have any revisions touched by these changesets, bail
1061 if not revs:
1061 if not revs:
1062 yield changegroup.closechunk()
1062 yield changegroup.closechunk()
1063 return
1063 return
1064
1064
1065 # add the parent of the first rev
1065 # add the parent of the first rev
1066 p = self.parentrevs(revs[0])[0]
1066 p = self.parentrevs(revs[0])[0]
1067 revs.insert(0, p)
1067 revs.insert(0, p)
1068 if p == nullrev:
1068 if p == nullrev:
1069 fullrev = True
1069 fullrev = True
1070
1070
1071 # build deltas
1071 # build deltas
1072 for d in xrange(len(revs) - 1):
1072 for d in xrange(len(revs) - 1):
1073 a, b = revs[d], revs[d + 1]
1073 a, b = revs[d], revs[d + 1]
1074 nb = self.node(b)
1074 nb = self.node(b)
1075
1075
1076 if infocollect is not None:
1076 if infocollect is not None:
1077 infocollect(nb)
1077 infocollect(nb)
1078
1078
1079 p = self.parents(nb)
1079 p = self.parents(nb)
1080 meta = nb + p[0] + p[1] + lookup(nb)
1080 meta = nb + p[0] + p[1] + lookup(nb)
1081 if fullrev:
1081 if fullrev:
1082 d = self.revision(nb)
1082 d = self.revision(nb)
1083 meta += mdiff.trivialdiffheader(len(d))
1083 meta += mdiff.trivialdiffheader(len(d))
1084 fullrev = False
1084 fullrev = False
1085 else:
1085 else:
1086 d = self.revdiff(a, b)
1086 d = self.revdiff(a, b)
1087 yield changegroup.chunkheader(len(meta) + len(d))
1087 yield changegroup.chunkheader(len(meta) + len(d))
1088 yield meta
1088 yield meta
1089 yield d
1089 yield d
1090
1090
1091 yield changegroup.closechunk()
1091 yield changegroup.closechunk()
1092
1092
def addgroup(self, bundle, linkmapper, transaction):
    """
    add a delta group

    given a set of deltas, add them to the revision log. the
    first delta is against its parent, which should be in our
    log, the rest are against the previous delta.

    bundle: chunk source; read one chunk per revision via
        bundle.parsechunk() until it returns a false value
    linkmapper: maps a changeset node to the linkrev to record
    transaction: journal entries are added so a failed pull can be
        rolled back

    Returns the node of the last revision added (None if the group
    was empty).
    """
    # node of the last revision added; this is the return value
    node = None

    r = len(self)
    end = 0
    if r:
        end = self.end(r - 1)
    ifh = self.opener(self.indexfile, "a+")
    isize = r * self._io.size
    if self._inline:
        # inline revlogs interleave data with index entries in one file
        transaction.add(self.indexfile, end + isize, r)
        dfh = None
    else:
        transaction.add(self.indexfile, isize, r)
        transaction.add(self.datafile, end)
        dfh = self.opener(self.datafile, "a")

    try:
        # loop through our set of deltas
        chain = None
        while True:
            chunkdata = bundle.parsechunk()
            if not chunkdata:
                break
            node = chunkdata['node']
            p1 = chunkdata['p1']
            p2 = chunkdata['p2']
            cs = chunkdata['cs']
            delta = chunkdata['data']

            link = linkmapper(cs)
            if (node in self.nodemap and
                (not self.flags(self.rev(node)) & REVIDX_PUNCHED_FLAG)):
                # this can happen if two branches make the same change
                chain = node
                continue

            for p in (p1, p2):
                if not p in self.nodemap:
                    # NOTE(review): shallow clones would need null
                    # entries inserted for missing parents here (the
                    # upstream XXX FIXME); until that is implemented
                    # both the shallow and non-shallow cases fail the
                    # same way, so the branches are merged.
                    raise LookupError(p, self.indexfile,
                                      _('unknown parent'))

            if not chain:
                # retrieve the parent revision of the delta chain
                chain = p1
                if not chain in self.nodemap:
                    raise LookupError(chain, self.indexfile,
                                      _('unknown base'))

            chainrev = self.rev(chain)
            chain = self._addrevision(node, None, transaction, link,
                                      p1, p2, (chainrev, delta), ifh, dfh)
            if not dfh and not self._inline:
                # addrevision switched from inline to conventional
                # reopen the index
                dfh = self.opener(self.datafile, "a")
                ifh = self.opener(self.indexfile, "a")
    finally:
        if dfh:
            dfh.close()
        ifh.close()

    return node
1180
1180
def strip(self, minlink, transaction):
    """truncate the revlog on the first revision with a linkrev >= minlink

    This function is called when we're stripping revision minlink and
    its descendants from the repository.

    We have to remove all revisions with linkrev >= minlink, because
    the equivalent changelog revisions will be renumbered after the
    strip.

    So we truncate the revlog on the first of these revisions, and
    trust that the caller has saved the revisions that shouldn't be
    removed and that it'll readd them after this truncation.
    """
    if len(self) == 0:
        return

    # locate the first revision whose linkrev (index tuple field 4)
    # reaches minlink; if none does, there is nothing to strip
    for rev in self:
        if self.index[rev][4] >= minlink:
            break
    else:
        return

    # first truncate the files on disk
    end = self.start(rev)
    if not self._inline:
        transaction.add(self.datafile, end)
        end = rev * self._io.size
    else:
        # inline data follows each index entry in the same file
        end += rev * self._io.size

    transaction.add(self.indexfile, end)

    # then reset internal state in memory to forget those revisions
    self._cache = None
    self._chunkclear()
    for stripped in xrange(rev, len(self)):
        del self.nodemap[self.node(stripped)]

    del self.index[rev:-1]
1221
1221
1222 def checksize(self):
1222 def checksize(self):
1223 expected = 0
1223 expected = 0
1224 if len(self):
1224 if len(self):
1225 expected = max(0, self.end(len(self) - 1))
1225 expected = max(0, self.end(len(self) - 1))
1226
1226
1227 try:
1227 try:
1228 f = self.opener(self.datafile)
1228 f = self.opener(self.datafile)
1229 f.seek(0, 2)
1229 f.seek(0, 2)
1230 actual = f.tell()
1230 actual = f.tell()
1231 dd = actual - expected
1231 dd = actual - expected
1232 except IOError, inst:
1232 except IOError, inst:
1233 if inst.errno != errno.ENOENT:
1233 if inst.errno != errno.ENOENT:
1234 raise
1234 raise
1235 dd = 0
1235 dd = 0
1236
1236
1237 try:
1237 try:
1238 f = self.opener(self.indexfile)
1238 f = self.opener(self.indexfile)
1239 f.seek(0, 2)
1239 f.seek(0, 2)
1240 actual = f.tell()
1240 actual = f.tell()
1241 s = self._io.size
1241 s = self._io.size
1242 i = max(0, actual // s)
1242 i = max(0, actual // s)
1243 di = actual - (i * s)
1243 di = actual - (i * s)
1244 if self._inline:
1244 if self._inline:
1245 databytes = 0
1245 databytes = 0
1246 for r in self:
1246 for r in self:
1247 databytes += max(0, self.length(r))
1247 databytes += max(0, self.length(r))
1248 dd = 0
1248 dd = 0
1249 di = actual - len(self) * s - databytes
1249 di = actual - len(self) * s - databytes
1250 except IOError, inst:
1250 except IOError, inst:
1251 if inst.errno != errno.ENOENT:
1251 if inst.errno != errno.ENOENT:
1252 raise
1252 raise
1253 di = 0
1253 di = 0
1254
1254
1255 return (dd, di)
1255 return (dd, di)
1256
1256
def files(self):
    """return the list of files backing this revlog

    The index file is always included; the data file is listed only
    for non-inline revlogs (inline revlogs keep their data inside the
    index file).
    """
    if self._inline:
        return [self.indexfile]
    return [self.indexfile, self.datafile]
General Comments 0
You need to be logged in to leave comments. Login now