revlog: fix bug in chainbase cache

Sune Foldager
r14296:62e25c63 default
@@ -1,1265 +1,1265 @@
# revlog.py - storage back-end for mercurial
#
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""

# import stuff from node for others to import from revlog
from node import bin, hex, nullid, nullrev, short #@UnusedImport
from i18n import _
import ancestor, mdiff, parsers, error, util
import struct, zlib, errno

_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog header flags
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOGGENERALDELTA = (1 << 17)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGGENERALDELTA

# revlog index flags
REVIDX_KNOWN_FLAGS = 0

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

RevlogError = error.RevlogError
LookupError = error.LookupError

def getoffset(q):
    return int(q >> 16)

def gettype(q):
    return int(q & 0xFFFF)

def offset_type(offset, type):
    return long(long(offset) << 16 | type)
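
The three helpers above pack a revision's data-file offset and its 16-bit flags field into a single 64-bit integer. A standalone round-trip check of that encoding (plain ints instead of Python 2's long; the sample values are made up):

```python
# Round-trip sketch of the packing used by getoffset/gettype/offset_type
# above; the offset and flag values are arbitrary samples.
def pack_offset_type(offset, flags):
    return (offset << 16) | flags   # high 48 bits: offset, low 16: flags

q = pack_offset_type(123456789, 0x0002)
assert q >> 16 == 123456789         # what getoffset recovers
assert q & 0xFFFF == 0x0002         # what gettype recovers
```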

nullhash = _sha(nullid)

def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    # As of now, if one of the parent nodes is null, p2 is null
    if p2 == nullid:
        # deep copy of a hash is faster than creating one
        s = nullhash.copy()
        s.update(p1)
    else:
        # none of the parent nodes are nullid
        l = [p1, p2]
        l.sort()
        s = _sha(l[0])
        s.update(l[1])
    s.update(text)
    return s.digest()
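
A self-contained sketch of the same hashing scheme using hashlib directly, showing that sorting the parents makes the result independent of parent order while still mixing history into the id. The 20-byte null id and the sample texts are placeholders:

```python
import hashlib

NULLID = b"\0" * 20  # stand-in for nullid

def node_hash(text, p1, p2):
    # hash the parents in sorted order, then the text; since NULLID is all
    # zero bytes, the p2 == NULLID fast path above sorts the same way
    s = hashlib.sha1(min(p1, p2))
    s.update(max(p1, p2))
    s.update(text)
    return s.digest()

root = node_hash(b"v1\n", NULLID, NULLID)
child = node_hash(b"v1\n", root, NULLID)
assert node_hash(b"v1\n", root, NULLID) == node_hash(b"v1\n", NULLID, root)
assert root != child  # same content, different history -> different node id
```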

def compress(text):
    """ generate a possibly-compressed representation of text """
    if not text:
        return ("", text)
    l = len(text)
    bin = None
    if l < 44:
        pass
    elif l > 1000000:
        # zlib makes an internal copy, thus doubling memory usage for
        # large files, so let's do this in pieces
        z = zlib.compressobj()
        p = []
        pos = 0
        while pos < l:
            pos2 = pos + 2**20
            p.append(z.compress(text[pos:pos2]))
            pos = pos2
        p.append(z.flush())
        if sum(map(len, p)) < l:
            bin = "".join(p)
    else:
        bin = _compress(text)
    if bin is None or len(bin) > l:
        if text[0] == '\0':
            return ("", text)
        return ('u', text)
    return ("", bin)

def decompress(bin):
    """ decompress the given input """
    if not bin:
        return bin
    t = bin[0]
    if t == '\0':
        return bin
    if t == 'x':
        return _decompress(bin)
    if t == 'u':
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)
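
The pair above relies on a one-byte tag: zlib output always begins with 'x', 'u' marks text stored verbatim because compression did not pay off, and text that already starts with a NUL needs no tag at all. A round-trip sketch of that convention (a simplified reimplementation, not the functions above):

```python
import zlib

def encode(text):
    if not text:
        return text
    comp = zlib.compress(text)
    if len(comp) < len(text):
        return comp                # zlib streams start with 'x' (0x78)
    if text[0:1] == b"\0":
        return text                # a leading NUL cannot be mistaken for a tag
    return b"u" + text             # tagged as stored-uncompressed

def decode(data):
    if not data or data[0:1] == b"\0":
        return data
    if data[0:1] == b"x":
        return zlib.decompress(data)
    if data[0:1] == b"u":
        return data[1:]
    raise ValueError("unknown compression type %r" % data[0:1])

for blob in (b"", b"abc", b"\0binary", b"abc" * 1000):
    assert decode(encode(blob)) == blob
```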

indexformatv0 = ">4l20s20s20s"
v0shaoffset = 56

class revlogoldio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, data, inline):
        s = self.size
        index = []
        nodemap = {nullid: nullrev}
        n = off = 0
        l = len(data)
        while off + s <= l:
            cur = data[off:off + s]
            off += s
            e = _unpack(indexformatv0, cur)
            # transform to revlogv1 format
            e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                  nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
            index.append(e2)
            nodemap[e[6]] = n
            n += 1

        # add the magic null revision at -1
        index.append((0, 0, 0, -1, -1, -1, -1, nullid))

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        if gettype(entry[0]):
            raise RevlogError(_("index entry flags need RevlogNG"))
        e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
              node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *e2)

# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
ngshaoffset = 32
versionformat = ">I"
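
The layout comment above can be checked directly with struct: ">Qiiiiii20s12x" describes one 64-byte record whose leading quad combines the 6-byte offset with the 2-byte flags. A pack/unpack sketch with made-up field values:

```python
import struct

indexformatng = ">Qiiiiii20s12x"
assert struct.calcsize(indexformatng) == 64   # fixed record size

entry = ((123456 << 16) | 0,  # offset 123456, flags 0
         2048,                # compressed length
         4096,                # uncompressed length
         7,                   # base rev of the delta chain
         9,                   # link rev
         7, -1,               # parent revs; -1 is the null revision
         b"\xaa" * 20)        # nodeid ("12x" pads the record to 64 bytes)
packed = struct.pack(indexformatng, *entry)
assert struct.unpack(indexformatng, packed) == entry
```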

class revlogio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, data, inline):
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, None, cache

    def packentry(self, entry, node, version, rev):
        p = _pack(indexformatng, *entry)
        if rev == 0:
            p = _pack(versionformat, version) + p[4:]
        return p

class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.
    """
    def __init__(self, opener, indexfile):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener
        self._cache = None
-        self._basecache = None
+        self._basecache = (0, 0)
        self._chunkcache = (0, '')
        self.index = []
        self._pcache = {}
        self._nodecache = {nullid: nullrev}
        self._nodepos = None

        v = REVLOG_DEFAULT_VERSION
        if hasattr(opener, 'options'):
            if 'defversion' in opener.options:
                v = opener.options['defversion']
                if v & REVLOGNG:
                    v |= REVLOGNGINLINEDATA
            if v & REVLOGNG and 'generaldelta' in opener.options:
                v |= REVLOGGENERALDELTA

        i = ''
        try:
            f = self.opener(self.indexfile)
            i = f.read()
            f.close()
            if len(i) > 0:
                v = struct.unpack(versionformat, i[:4])[0]
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise

        self.version = v
        self._inline = v & REVLOGNGINLINEDATA
        self._generaldelta = v & REVLOGGENERALDELTA
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        if fmt == REVLOGV0 and flags:
            raise RevlogError(_("index %s unknown flags %#04x for format v0")
                              % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
            raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                              % (self.indexfile, flags >> 16))
        elif fmt > REVLOGNG:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))

        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        try:
            d = self._io.parseindex(i, self._inline)
        except (ValueError, IndexError):
            raise RevlogError(_("index %s is corrupted") % (self.indexfile))
        self.index, nodemap, self._chunkcache = d
        if nodemap is not None:
            self.nodemap = self._nodecache = nodemap
        if not self._chunkcache:
            self._chunkclear()
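
The version dword parsed above splits into a 16-bit format number and high-order feature flags; a minimal illustration using the constants defined at the top of the file:

```python
REVLOGNG = 1
REVLOGNGINLINEDATA = 1 << 16
REVLOGGENERALDELTA = 1 << 17

v = REVLOGNG | REVLOGNGINLINEDATA | REVLOGGENERALDELTA
assert v & 0xFFFF == REVLOGNG                                  # fmt
assert v & ~0xFFFF == REVLOGNGINLINEDATA | REVLOGGENERALDELTA  # flags
```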

    def tip(self):
        return self.node(len(self.index) - 2)
    def __len__(self):
        return len(self.index) - 1
    def __iter__(self):
        for i in xrange(len(self)):
            yield i

    @util.propertycache
    def nodemap(self):
        self.rev(self.node(0))
        return self._nodecache

    def rev(self, node):
        try:
            return self._nodecache[node]
        except KeyError:
            n = self._nodecache
            i = self.index
            p = self._nodepos
            if p is None:
                p = len(i) - 2
            for r in xrange(p, -1, -1):
                v = i[r][7]
                n[v] = r
                if v == node:
                    self._nodepos = r - 1
                    return r
            raise LookupError(node, self.indexfile, _('no node'))

    def node(self, rev):
        return self.index[rev][7]
    def linkrev(self, rev):
        return self.index[rev][4]
    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
    def parentrevs(self, rev):
        return self.index[rev][5:7]
    def start(self, rev):
        return int(self.index[rev][0] >> 16)
    def end(self, rev):
        return self.start(rev) + self.length(rev)
    def length(self, rev):
        return self.index[rev][1]
    def chainbase(self, rev):
        index = self.index
        base = index[rev][3]
        while base != rev:
            rev = base
            base = index[rev][3]
        return base
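
chainbase is what this commit's cache is about: it follows the base field (entry[3]) until it reaches a revision that is its own base, i.e. a full snapshot. A toy walk over a made-up index:

```python
# entry[3] in miniature: rev -> base rev; a rev whose base is itself
# stores a full text, everything else is a delta.
bases = {0: 0, 1: 0, 2: 1}    # made-up chain: 2 deltas against 1, 1 against 0

def chainbase(rev):
    base = bases[rev]
    while base != rev:        # walk until the chain bottoms out
        rev = base
        base = bases[rev]
    return base

assert chainbase(2) == 0      # each call walks the whole chain: O(chain)
```
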
    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF
    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.revision(self.node(rev))
        return len(t)
    size = rawsize

    def reachable(self, node, stop=None):
        """return the set of all nodes ancestral to a given node, including
        the node itself, stopping when stop is matched"""
        reachable = set((node,))
        visit = [node]
        if stop:
            stopn = self.rev(stop)
        else:
            stopn = 0
        while visit:
            n = visit.pop(0)
            if n == stop:
                continue
            if n == nullid:
                continue
            for p in self.parents(n):
                if self.rev(p) < stopn:
                    continue
                if p not in reachable:
                    reachable.add(p)
                    visit.append(p)
        return reachable

    def ancestors(self, *revs):
        """Generate the ancestors of 'revs' in reverse topological order.

        Yield a sequence of revision numbers starting with the parents
        of each revision in revs, i.e., each revision is *not* considered
        an ancestor of itself. Results are in breadth-first order:
        parents of each rev in revs, then parents of those, etc. Result
        does not include the null revision."""
        visit = list(revs)
        seen = set([nullrev])
        while visit:
            for parent in self.parentrevs(visit.pop(0)):
                if parent not in seen:
                    visit.append(parent)
                    seen.add(parent)
                    yield parent

    def descendants(self, *revs):
        """Generate the descendants of 'revs' in revision order.

        Yield a sequence of revision numbers starting with a child of
        some rev in revs, i.e., each revision is *not* considered a
        descendant of itself. Results are ordered by revision number (a
        topological sort)."""
        first = min(revs)
        if first == nullrev:
            for i in self:
                yield i
            return

        seen = set(revs)
        for i in xrange(first + 1, len(self)):
            for x in self.parentrevs(i):
                if x != nullrev and x in seen:
                    seen.add(i)
                    yield i
                    break
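
A tiny driver for the traversal logic above on a made-up four-revision graph (rev -> (p1, p2), with -1 standing in for nullrev):

```python
nullrev = -1
parentrevs = {0: (nullrev, nullrev), 1: (0, nullrev),
              2: (0, nullrev), 3: (1, 2)}.__getitem__

def ancestors(*revs):
    # breadth-first: parents of revs, then their parents, and so on
    visit = list(revs)
    seen = set([nullrev])
    while visit:
        for parent in parentrevs(visit.pop(0)):
            if parent not in seen:
                visit.append(parent)
                seen.add(parent)
                yield parent

assert sorted(ancestors(3)) == [0, 1, 2]  # a rev is not its own ancestor
```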

    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common.

        More specifically, the second element is a list of nodes N such that
        every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        has = set(self.ancestors(*common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = [r for r in heads if r not in has]
        while visit:
            r = visit.pop(0)
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(r) for r in missing]

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        _common, missing = self.findcommonmissing(common, heads)
        return missing

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendant of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendant of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n) # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendants = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendants.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendants, empty parents will look like
        # they're descendants.
        for r in xrange(max(lowestrev, 0), highestrev + 1):
            n = self.node(r)
            isdescendant = False
            if lowestrev == nullrev: # Everybody is a descendant of nullid
                isdescendant = True
            elif n in descendants:
                # n is already a descendant
                isdescendant = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendants before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendants, it's not a root.
                    if (p[0] in descendants) or (p[1] in descendants):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendant if either of its parents are
                # descendants. (We seeded the dependents list with the roots
                # up there, remember?)
                if (p[0] in descendants) or (p[1] in descendants):
                    descendants.add(n)
                    isdescendant = True
            if isdescendant and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendants and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n, flag in heads.iteritems() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        ishead = [1] * (count + 1)
        index = self.index
        for r in xrange(count):
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0
        return [r for r in xrange(count) if ishead[r]]
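
headrevs in miniature: start by assuming every revision is a head, then clear the flag for anything that occurs as a parent. The extra list slot makes writes for nullrev (-1) land harmlessly at the end:

```python
nullrev = -1
parents = [(nullrev, nullrev), (0, nullrev), (0, nullrev), (1, nullrev)]

count = len(parents)
ishead = [1] * (count + 1)     # the spare slot (index -1) absorbs nullrev
for p1, p2 in parents:
    ishead[p1] = ishead[p2] = 0
assert [r for r in range(count) if ishead[r]] == [2, 3]
```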

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = set([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = set((startrev,))
        heads = set((startrev,))

        parentrevs = self.parentrevs
        for r in xrange(startrev + 1, len(self)):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable.add(r)
                        heads.add(r)
                    if p in heads and p not in stoprevs:
                        heads.remove(p)

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in range(p + 1, len(self)):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def descendant(self, start, end):
        if start == nullrev:
            return True
        for i in self.descendants(start):
            if i == end:
                return True
            elif i > end:
                break
        return False

    def ancestor(self, a, b):
        """calculate the least common ancestor of nodes a and b"""

        # fast path, check if it is a descendant
        a, b = self.rev(a), self.rev(b)
        start, end = sorted((a, b))
        if self.descendant(start, end):
            return self.node(start)

        def parents(rev):
            return [p for p in self.parentrevs(rev) if p != nullrev]

        c = ancestor.ancestor(a, b, parents)
        if c is None:
            return nullid

        return self.node(c)

    def _match(self, id):
        if isinstance(id, (long, int)):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if str(rev) != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (TypeError, LookupError):
                pass

    def _partialmatch(self, id):
        if id in self._pcache:
            return self._pcache[id]

        if len(id) < 40:
            try:
                # hex(node)[:...]
                l = len(id) // 2 # grab an even number of digits
                prefix = bin(id[:l * 2])
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [n for n in nl if hex(n).startswith(id)]
                if len(nl) > 0:
                    if len(nl) == 1:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise LookupError(id, self.indexfile,
                                      _('ambiguous identifier'))
                return None
            except TypeError:
                pass

    def lookup(self, id):
        """locate a node based on:
            - revision number or str(revision number)
            - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(id, self.indexfile, _('no match found'))

    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different than what is stored.
        """
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def _addchunk(self, offset, data):
        o, d = self._chunkcache
        # try to add to existing cache
        if o + len(d) == offset and len(d) + len(data) < _chunksize:
            self._chunkcache = o, d + data
        else:
            self._chunkcache = offset, data

    def _loadchunk(self, offset, length):
        if self._inline:
            df = self.opener(self.indexfile)
        else:
            df = self.opener(self.datafile)

        readahead = max(65536, length)
        df.seek(offset)
        d = df.read(readahead)
        self._addchunk(offset, d)
        if readahead > length:
            return d[:length]
        return d

    def _getchunk(self, offset, length):
        o, d = self._chunkcache
        l = len(d)

        # is it in the cache?
        cachestart = offset - o
        cacheend = cachestart + length
        if cachestart >= 0 and cacheend <= l:
            if cachestart == 0 and cacheend == l:
                return d # avoid a copy
            return d[cachestart:cacheend]

        return self._loadchunk(offset, length)
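
The three methods above implement a single-window read cache with read-ahead: a read adjacent to the cached window extends it, anything else replaces it. A self-contained sketch over an in-memory "file":

```python
class ChunkCache(object):
    """Sketch of the (offset, data) window kept in _chunkcache above."""
    def __init__(self, data, readahead=64):
        self._data = data          # stands in for the on-disk data file
        self._readahead = readahead
        self._cache = (0, b"")

    def read(self, offset, length):
        o, d = self._cache
        start = offset - o
        if start >= 0 and start + length <= len(d):
            return d[start:start + length]          # cache hit
        chunk = self._data[offset:offset + max(length, self._readahead)]
        if o + len(d) == offset:                    # contiguous: extend
            self._cache = (o, d + chunk)
        else:                                       # otherwise: replace
            self._cache = (offset, chunk)
        return chunk[:length]

c = ChunkCache(bytes(bytearray(range(256))))
first = c.read(10, 4)
assert c.read(10, 4) == first   # second read is served from the cache
```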

    def _chunkraw(self, startrev, endrev):
        start = self.start(startrev)
        length = self.end(endrev) - start
        if self._inline:
            start += (startrev + 1) * self._io.size
        return self._getchunk(start, length)

    def _chunk(self, rev):
        return decompress(self._chunkraw(rev, rev))

    def _chunkbase(self, rev):
        return self._chunk(rev)

    def _chunkclear(self):
        self._chunkcache = (0, '')

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self._generaldelta:
            return base
        else:
            return rev - 1

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return self._chunk(rev2)

        return mdiff.textdiff(self.revision(self.node(rev1)),
                              self.revision(self.node(rev2)))

    def revision(self, node):
        """return an uncompressed revision of a given node"""
        cachedrev = None
        if node == nullid:
            return ""
        if self._cache:
            if self._cache[0] == node:
                return self._cache[2]
            cachedrev = self._cache[1]

        # look up what we need to read
        text = None
        rev = self.rev(node)

        # check rev flags
        if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
            raise RevlogError(_('incompatible revision flag %x') %
                              (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

        # build delta chain
        chain = []
        index = self.index # for performance
        generaldelta = self._generaldelta
        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != cachedrev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]
        chain.reverse()
        base = iterrev

        if iterrev == cachedrev:
            # cache hit
            text = self._cache[2]

        # drop cache to save memory
        self._cache = None

        self._chunkraw(base, rev)
        if text is None:
            text = self._chunkbase(base)

        bins = [self._chunk(r) for r in chain]
        text = mdiff.patches(text, bins)

        text = self._checkhash(text, node, rev)

        self._cache = (node, rev, text)
        return text
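
revision() reconstructs a text by finding the chain base and replaying deltas forward. A toy version of just that chain walk, with callable "deltas" standing in for the binary patches that mdiff applies:

```python
# rev -> either ("full", text) or ("delta", baserev, patch-function)
store = {
    0: ("full", b"line1\n"),
    1: ("delta", 0, lambda t: t + b"line2\n"),
    2: ("delta", 1, lambda t: t + b"line3\n"),
}

def revision(rev):
    chain = []
    while store[rev][0] == "delta":   # walk back to the chain base
        chain.append(store[rev][2])
        rev = store[rev][1]
    text = store[rev][1]
    for patch in reversed(chain):     # replay deltas oldest-first
        text = patch(text)
    return text

assert revision(2) == b"line1\nline2\nline3\n"
```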

    def _checkhash(self, text, node, rev):
        p1, p2 = self.parents(node)
        if node != hash(text, p1, p2):
            raise RevlogError(_("integrity check failed on %s:%d")
                              % (self.indexfile, rev))
        return text

    def checkinlinesize(self, tr, fp=None):
        if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
            return

        trinfo = tr.find(self.indexfile)
        if trinfo is None:
            raise RevlogError(_("%s not found in the transaction")
                              % self.indexfile)

        trindex = trinfo[2]
        dataoff = self.start(trindex)

        tr.add(self.datafile, dataoff)

        if fp:
            fp.flush()
            fp.close()

        df = self.opener(self.datafile, 'w')
        try:
            for r in self:
                df.write(self._chunkraw(r, r))
        finally:
            df.close()

        fp = self.opener(self.indexfile, 'w', atomictemp=True)
        self.version &= ~(REVLOGNGINLINEDATA)
        self._inline = False
        for i in self:
            e = self._io.packentry(self.index[i], self.node, self.version, i)
            fp.write(e)

        # if we don't call rename, the temp file will never replace the
        # real index
        fp.rename()

        tr.replace(self.indexfile, trindex * self._io.size)
        self._chunkclear()

954 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):
954 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):
955 """add a revision to the log
955 """add a revision to the log
956
956
957 text - the revision data to add
957 text - the revision data to add
958 transaction - the transaction object used for rollback
958 transaction - the transaction object used for rollback
959 link - the linkrev data to add
959 link - the linkrev data to add
960 p1, p2 - the parent nodeids of the revision
960 p1, p2 - the parent nodeids of the revision
961 cachedelta - an optional precomputed delta
961 cachedelta - an optional precomputed delta
962 """
962 """
963 node = hash(text, p1, p2)
963 node = hash(text, p1, p2)
964 if node in self.nodemap:
964 if node in self.nodemap:
965 return node
965 return node
966
966
967 dfh = None
967 dfh = None
968 if not self._inline:
968 if not self._inline:
969 dfh = self.opener(self.datafile, "a")
969 dfh = self.opener(self.datafile, "a")
970 ifh = self.opener(self.indexfile, "a+")
970 ifh = self.opener(self.indexfile, "a+")
971 try:
971 try:
972 return self._addrevision(node, text, transaction, link, p1, p2,
972 return self._addrevision(node, text, transaction, link, p1, p2,
973 cachedelta, ifh, dfh)
973 cachedelta, ifh, dfh)
974 finally:
974 finally:
975 if dfh:
975 if dfh:
976 dfh.close()
976 dfh.close()
977 ifh.close()
977 ifh.close()
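
    # Illustrative sketch (hypothetical caller; 'rlog', 'tr', 'linkrev' and
    # the parent nodes are invented names supplied by surrounding repository
    # machinery):
    #
    #   node = rlog.addrevision("file contents", tr, linkrev,
    #                           p1node, p2node)
    #   assert node in rlog.nodemap   # a duplicate add returns the same node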

    def _addrevision(self, node, text, transaction, link, p1, p2,
                     cachedelta, ifh, dfh):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.
        invariants:
        - text is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        btext = [text]
        def buildtext():
            if btext[0] is not None:
                return btext[0]
            # flush any pending writes here so we can read it in revision
            if dfh:
                dfh.flush()
            ifh.flush()
            basetext = self.revision(self.node(cachedelta[0]))
            btext[0] = mdiff.patch(basetext, cachedelta[1])
            chk = hash(btext[0], p1, p2)
            if chk != node:
                raise RevlogError(_("consistency error in delta"))
            return btext[0]
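
        # Commentary: btext is a one-element list rather than a plain local
        # because this is Python 2 code with no 'nonlocal'; the closure
        # mutates btext[0] to cache the lazily reconstructed full text so it
        # is built at most once.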

        def builddelta(rev):
            # can we use the cached delta?
            if cachedelta and cachedelta[0] == rev:
                delta = cachedelta[1]
            else:
                t = buildtext()
                ptext = self.revision(self.node(rev))
                delta = mdiff.textdiff(ptext, t)
            data = compress(delta)
            l = len(data[1]) + len(data[0])
            if basecache and basecache[0] == rev:
                chainbase = basecache[1]
            else:
                chainbase = self.chainbase(rev)
            dist = l + offset - self.start(chainbase)
            if self._generaldelta:
                base = rev
            else:
                base = chainbase
            return dist, l, data, base, chainbase
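
        # Commentary: basecache can be None before any revision has been
        # cached, so it is tested for truth before indexing into it. The
        # chain base is also returned alongside the delta base, since the
        # two differ when general deltas are in use and the caller needs
        # the chain base to keep its cache correct.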

        curr = len(self)
        prev = curr - 1
        base = chainbase = curr
        offset = self.end(prev)
        flags = 0
        d = None
        basecache = self._basecache
        p1r, p2r = self.rev(p1), self.rev(p2)

        # should we try to build a delta?
        if prev != nullrev:
            if self._generaldelta:
                d = builddelta(p1r)
            else:
                d = builddelta(prev)
            dist, l, data, base, chainbase = d

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if text is None:
            textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                        cachedelta[1])
        else:
            textlen = len(text)
        if d is None or dist > textlen * 2:
            text = buildtext()
            data = compress(text)
            l = len(data[1]) + len(data[0])
            base = chainbase = curr
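
        # Commentary (hypothetical numbers): for a 1000-byte text, a delta
        # chain whose compressed span since the chain base exceeds 2000
        # bytes triggers a full version here, bounding reconstruction work
        # at roughly twice the uncompressed size.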

        e = (offset_type(offset, flags), l, textlen,
             base, link, p1r, p2r, node)
        self.index.insert(-1, e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version, curr)
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            dfh.flush()
            ifh.write(entry)
        else:
            offset += curr * self._io.size
            transaction.add(self.indexfile, offset, curr)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self.checkinlinesize(transaction, ifh)

        if type(text) == str: # only accept immutable objects
            self._cache = (node, curr, text)
        self._basecache = (curr, chainbase)
        return node
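
    # Commentary on the fix this changeset makes: _basecache previously
    # stored (curr, base), but with general deltas the delta base is the
    # parent revision rather than the start of the chain, so the cache could
    # hand back a bogus chain base. Caching (curr, chainbase) instead keeps
    # the invariant that _basecache maps a revision to its chain base.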

    def group(self, nodelist, bundler):
        """Calculate a delta group, yielding a sequence of changegroup chunks
        (strings).

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes. The first delta is
        first parent(nodelist[0]) -> nodelist[0]; the receiver is
        guaranteed to have this parent as it has all history before
        these changesets. If the first parent is nullrev the
        changegroup starts with a full revision.
        """

        revs = sorted([self.rev(n) for n in nodelist])

        # if we don't have any revisions touched by these changesets, bail
        if not revs:
            yield bundler.close()
            return

        # add the parent of the first rev
        p = self.parentrevs(revs[0])[0]
        revs.insert(0, p)

        # build deltas
        for r in xrange(len(revs) - 1):
            prev, curr = revs[r], revs[r + 1]
            for c in bundler.revchunk(self, curr, prev):
                yield c

        yield bundler.close()
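
    # Illustrative sketch (hypothetical revisions): for a nodelist mapping
    # to revs [5, 7], the yielded chunks encode the deltas
    #
    #   parent(5) -> 5, then 5 -> 7
    #
    # so a receiver that already holds everything up to parent(5) can
    # rebuild both revisions in order.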

    def addgroup(self, bundle, linkmapper, transaction):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.
        """

        # track the base of the current delta log
        node = None

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self.opener(self.indexfile, "a+")
        isize = r * self._io.size
        if self._inline:
            transaction.add(self.indexfile, end + isize, r)
            dfh = None
        else:
            transaction.add(self.indexfile, isize, r)
            transaction.add(self.datafile, end)
            dfh = self.opener(self.datafile, "a")

        try:
            # loop through our set of deltas
            chain = None
            while 1:
                chunkdata = bundle.deltachunk(chain)
                if not chunkdata:
                    break
                node = chunkdata['node']
                p1 = chunkdata['p1']
                p2 = chunkdata['p2']
                cs = chunkdata['cs']
                deltabase = chunkdata['deltabase']
                delta = chunkdata['delta']

                link = linkmapper(cs)
                if node in self.nodemap:
                    # this can happen if two branches make the same change
                    chain = node
                    continue

                for p in (p1, p2):
                    if p not in self.nodemap:
                        raise LookupError(p, self.indexfile,
                                          _('unknown parent'))

                if deltabase not in self.nodemap:
                    raise LookupError(deltabase, self.indexfile,
                                      _('unknown delta base'))

                baserev = self.rev(deltabase)
                chain = self._addrevision(node, None, transaction, link,
                                          p1, p2, (baserev, delta), ifh, dfh)
                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self.opener(self.datafile, "a")
                    ifh = self.opener(self.indexfile, "a")
        finally:
            if dfh:
                dfh.close()
            ifh.close()

        return node
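
    # Illustrative sketch of a single delta chunk as consumed above (field
    # values are hypothetical placeholders):
    #
    #   chunkdata = {'node': node20, 'p1': p1node, 'p2': p2node,
    #                'cs': csnode, 'deltabase': basenode,
    #                'delta': binarydelta}
    #
    # 'deltabase' names the revision the delta applies against; on the wire
    # this is typically the previously transmitted revision.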

    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll readd them after this truncation.
        """
        if len(self) == 0:
            return

        for rev in self:
            if self.index[rev][4] >= minlink:
                break
        else:
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chunkclear()
        for x in xrange(rev, len(self)):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]
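
    # Commentary (hypothetical numbers, assuming the 64-byte RevlogNG entry
    # size): stripping at rev 10 of a non-inline revlog cuts the data file
    # at start(10) and the index at 10 * 64 bytes; for an inline revlog both
    # live in the .i file, so the single cut point is start(10) + 10 * 64.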

    def checksize(self):
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            f = self.opener(self.datafile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            dd = actual - expected
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            s = self._io.size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)
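
    # Commentary: checksize() reports (dd, di), where dd is how far the data
    # file's size deviates from what the index implies and di is the excess
    # in the index file itself; (0, 0) means the files are consistent. A
    # hypothetical verification loop:
    #
    #   dd, di = rlog.checksize()
    #   if dd or di:
    #       print 'revlog %s looks damaged' % rlog.indexfile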

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res