upstream/mercurial-mirror Commit - r1941:75188237

1

"""

1

"""

2

revlog.py - storage back-end for mercurial

2

revlog.py - storage back-end for mercurial

3

4

This provides efficient delta storage with O(1) retrieve and append

4

This provides efficient delta storage with O(1) retrieve and append

5

and O(changes) merge between branches

5

and O(changes) merge between branches

6

7

8

9

This software may be used and distributed according to the terms

9

This software may be used and distributed according to the terms

10

of the GNU General Public License, incorporated herein by reference.

10

of the GNU General Public License, incorporated herein by reference.

11

"""

11

"""

12

13

from node import *

13

from node import *

14

from i18n import gettext as _

14

from i18n import gettext as _

15

from demandload import demandload

15

from demandload import demandload

16

demandload(globals(), "binascii errno heapq mdiff os sha struct zlib")

16

demandload(globals(), "binascii errno heapq mdiff os sha struct zlib")

17

18

def hash(text, p1, p2):

18

def hash(text, p1, p2):

19

"""generate a hash from the given text and its parent hashes

19

"""generate a hash from the given text and its parent hashes

20

21

This hash combines both the current file contents and its history

21

This hash combines both the current file contents and its history

22

in a manner that makes it easy to distinguish nodes with the same

22

in a manner that makes it easy to distinguish nodes with the same

23

content in the revision graph.

23

content in the revision graph.

24

"""

24

"""

25

l = [p1, p2]

25

l = [p1, p2]

26

l.sort()

26

l.sort()

27

s = sha.new(l[0])

27

s = sha.new(l[0])

28

s.update(l[1])

28

s.update(l[1])

29

s.update(text)

29

s.update(text)

30

return s.digest()

30

return s.digest()

31

32

def compress(text):

32

def compress(text):

33

""" generate a possibly-compressed representation of text """

33

""" generate a possibly-compressed representation of text """

34

if not text: return ("", text)

34

if not text: return ("", text)

35

if len(text) < 44:

35

if len(text) < 44:

36

if text[0] == '\0': return ("", text)

36

if text[0] == '\0': return ("", text)

37

return ('u', text)

37

return ('u', text)

38

bin = zlib.compress(text)

38

bin = zlib.compress(text)

39

if len(bin) > len(text):

39

if len(bin) > len(text):

40

if text[0] == '\0': return ("", text)

40

if text[0] == '\0': return ("", text)

41

return ('u', text)

41

return ('u', text)

42

return ("", bin)

42

return ("", bin)

43

44

def decompress(bin):

44

def decompress(bin):

45

""" decompress the given input """

45

""" decompress the given input """

46

if not bin: return bin

46

if not bin: return bin

47

t = bin[0]

47

t = bin[0]

48

if t == '\0': return bin

48

if t == '\0': return bin

49

if t == 'x': return zlib.decompress(bin)

49

if t == 'x': return zlib.decompress(bin)

50

if t == 'u': return bin[1:]

50

if t == 'u': return bin[1:]

51

raise RevlogError(_("unknown compression type %r") % t)

51

raise RevlogError(_("unknown compression type %r") % t)

52

53

indexformat = ">4l20s20s20s"

53

indexformat = ">4l20s20s20s"

54

55

class lazyparser(object):

55

class lazyparser(object):

56

"""

56

"""

57

this class avoids the need to parse the entirety of large indices

57

this class avoids the need to parse the entirety of large indices

58

59

By default we parse and load 1000 entries at a time.

59

By default we parse and load 1000 entries at a time.

60

61

If no position is specified, we load the whole index, and replace

61

If no position is specified, we load the whole index, and replace

62

the lazy objects in revlog with the underlying objects for

62

the lazy objects in revlog with the underlying objects for

63

efficiency in cases where we look at most of the nodes.

63

efficiency in cases where we look at most of the nodes.

64

"""

64

"""

65

def __init__(self, data, revlog):

65

def __init__(self, data, revlog):

66

self.data = data

66

self.data = data

67

self.s = struct.calcsize(indexformat)

67

self.s = struct.calcsize(indexformat)

68

self.l = len(data)/self.s

68

self.l = len(data)/self.s

69

self.index = [None] * self.l

69

self.index = [None] * self.l

70

self.map = {nullid: -1}

70

self.map = {nullid: -1}

71

self.all = 0

71

self.all = 0

72

self.revlog = revlog

72

self.revlog = revlog

73

74

def trunc(self, pos):

74

def trunc(self, pos):

75

self.l = pos/self.s

75

self.l = pos/self.s

76

77

def load(self, pos=None):

77

def load(self, pos=None):

78

if self.all: return

78

if self.all: return

79

if pos is not None:

79

if pos is not None:

80

block = pos / 1000

80

block = pos / 1000

81

i = block * 1000

81

i = block * 1000

82

end = min(self.l, i + 1000)

82

end = min(self.l, i + 1000)

83

else:

83

else:

84

self.all = 1

84

self.all = 1

85

i = 0

85

i = 0

86

end = self.l

86

end = self.l

87

self.revlog.index = self.index

87

self.revlog.index = self.index

88

self.revlog.nodemap = self.map

88

self.revlog.nodemap = self.map

89

90

while i < end:

90

while i < end:

91

d = self.data[i * self.s: (i + 1) * self.s]

91

d = self.data[i * self.s: (i + 1) * self.s]

92

e = struct.unpack(indexformat, d)

92

e = struct.unpack(indexformat, d)

93

self.index[i] = e

93

self.index[i] = e

94

self.map[e[6]] = i

94

self.map[e[6]] = i

95

i += 1

95

i += 1

96

97

class lazyindex(object):

97

class lazyindex(object):

98

"""a lazy version of the index array"""

98

"""a lazy version of the index array"""

99

def __init__(self, parser):

99

def __init__(self, parser):

100

self.p = parser

100

self.p = parser

101

def __len__(self):

101

def __len__(self):

102

return len(self.p.index)

102

return len(self.p.index)

103

def load(self, pos):

103

def load(self, pos):

104

if pos < 0:

104

if pos < 0:

105

pos += len(self.p.index)

105

pos += len(self.p.index)

106

self.p.load(pos)

106

self.p.load(pos)

107

return self.p.index[pos]

107

return self.p.index[pos]

108

def __getitem__(self, pos):

108

def __getitem__(self, pos):

109

return self.p.index[pos] or self.load(pos)

109

return self.p.index[pos] or self.load(pos)

110

def __delitem__(self, pos):

110

def __delitem__(self, pos):

111

del self.p.index[pos]

111

del self.p.index[pos]

112

def append(self, e):

112

def append(self, e):

113

self.p.index.append(e)

113

self.p.index.append(e)

114

def trunc(self, pos):

114

def trunc(self, pos):

115

self.p.trunc(pos)

115

self.p.trunc(pos)

116

117

class lazymap(object):

117

class lazymap(object):

118

"""a lazy version of the node map"""

118

"""a lazy version of the node map"""

119

def __init__(self, parser):

119

def __init__(self, parser):

120

self.p = parser

120

self.p = parser

121

def load(self, key):

121

def load(self, key):

122

if self.p.all: return

122

if self.p.all: return

123

n = self.p.data.find(key)

123

n = self.p.data.find(key)

124

if n < 0:

124

if n < 0:

125

raise KeyError(key)

125

raise KeyError(key)

126

pos = n / self.p.s

126

pos = n / self.p.s

127

self.p.load(pos)

127

self.p.load(pos)

128

def __contains__(self, key):

128

def __contains__(self, key):

129

self.p.load()

129

self.p.load()

130

return key in self.p.map

130

return key in self.p.map

131

def __iter__(self):

131

def __iter__(self):

132

yield nullid

132

yield nullid

133

for i in xrange(self.p.l):

133

for i in xrange(self.p.l):

134

try:

134

try:

135

yield self.p.index[i][6]

135

yield self.p.index[i][6]

136

except:

136

except:

137

self.p.load(i)

137

self.p.load(i)

138

yield self.p.index[i][6]

138

yield self.p.index[i][6]

139

def __getitem__(self, key):

139

def __getitem__(self, key):

140

try:

140

try:

141

return self.p.map[key]

141

return self.p.map[key]

142

except KeyError:

142

except KeyError:

143

try:

143

try:

144

self.load(key)

144

self.load(key)

145

return self.p.map[key]

145

return self.p.map[key]

146

except KeyError:

146

except KeyError:

147

raise KeyError("node " + hex(key))

147

raise KeyError("node " + hex(key))

148

def __setitem__(self, key, val):

148

def __setitem__(self, key, val):

149

self.p.map[key] = val

149

self.p.map[key] = val

150

def __delitem__(self, key):

150

def __delitem__(self, key):

151

del self.p.map[key]

151

del self.p.map[key]

152

153

class RevlogError(Exception): pass

153

class RevlogError(Exception): pass

154

155

class revlog(object):

155

class revlog(object):

156

"""

156

"""

157

the underlying revision storage object

157

the underlying revision storage object

158

159

A revlog consists of two parts, an index and the revision data.

159

A revlog consists of two parts, an index and the revision data.

160

161

The index is a file with a fixed record size containing

161

The index is a file with a fixed record size containing

162

information on each revision, includings its nodeid (hash), the

162

information on each revision, includings its nodeid (hash), the

163

nodeids of its parents, the position and offset of its data within

163

nodeids of its parents, the position and offset of its data within

164

the data file, and the revision it's based on. Finally, each entry

164

the data file, and the revision it's based on. Finally, each entry

165

contains a linkrev entry that can serve as a pointer to external

165

contains a linkrev entry that can serve as a pointer to external

166

data.

166

data.

167

168

The revision data itself is a linear collection of data chunks.

168

The revision data itself is a linear collection of data chunks.

169

Each chunk represents a revision and is usually represented as a

169

Each chunk represents a revision and is usually represented as a

170

delta against the previous chunk. To bound lookup time, runs of

170

delta against the previous chunk. To bound lookup time, runs of

171

deltas are limited to about 2 times the length of the original

171

deltas are limited to about 2 times the length of the original

172

version data. This makes retrieval of a version proportional to

172

version data. This makes retrieval of a version proportional to

173

its size, or O(1) relative to the number of revisions.

173

its size, or O(1) relative to the number of revisions.

174

175

Both pieces of the revlog are written to in an append-only

175

Both pieces of the revlog are written to in an append-only

176

fashion, which means we never need to rewrite a file to insert or

176

fashion, which means we never need to rewrite a file to insert or

177

remove data, and can use some simple techniques to avoid the need

177

remove data, and can use some simple techniques to avoid the need

178

for locking while reading.

178

for locking while reading.

179

"""

179

"""

180

def __init__(self, opener, indexfile, datafile):

180

def __init__(self, opener, indexfile, datafile):

181

"""

181

"""

182

create a revlog object

182

create a revlog object

183

184

opener is a function that abstracts the file opening operation

184

opener is a function that abstracts the file opening operation

185

and can be used to implement COW semantics or the like.

185

and can be used to implement COW semantics or the like.

186

"""

186

"""

187

self.indexfile = indexfile

187

self.indexfile = indexfile

188

self.datafile = datafile

188

self.datafile = datafile

189

self.opener = opener

189

self.opener = opener

190

191

self.indexstat = None

191

self.indexstat = None

192

self.cache = None

192

self.cache = None

193

self.chunkcache = None

193

self.chunkcache = None

194

self.load()

194

self.load()

195

196

def load(self):

196

def load(self):

197

try:

197

try:

198

f = self.opener(self.indexfile)

198

f = self.opener(self.indexfile)

199

except IOError, inst:

199

except IOError, inst:

200

if inst.errno != errno.ENOENT:

200

if inst.errno != errno.ENOENT:

201

raise

201

raise

202

i = ""

202

i = ""

203

else:

203

else:

204

try:

204

try:

205

st = os.fstat(f.fileno())

205

st = os.fstat(f.fileno())

206

except AttributeError, inst:

206

except AttributeError, inst:

207

st = None

207

st = None

208

else:

208

else:

209

oldst = self.indexstat

209

oldst = self.indexstat

210

if (oldst and st.st_dev == oldst.st_dev

210

if (oldst and st.st_dev == oldst.st_dev

211

and st.st_ino == oldst.st_ino

211

and st.st_ino == oldst.st_ino

212

and st.st_mtime == oldst.st_mtime

212

and st.st_mtime == oldst.st_mtime

213

and st.st_ctime == oldst.st_ctime):

213

and st.st_ctime == oldst.st_ctime):

214

return

214

return

215

self.indexstat = st

215

self.indexstat = st

216

i = f.read()

216

i = f.read()

217

218

if i and i[:4] != "\0\0\0\0":

218

if i and i[:4] != "\0\0\0\0":

219

raise RevlogError(_("incompatible revlog signature on %s") %

219

raise RevlogError(_("incompatible revlog signature on %s") %

220

self.indexfile)

220

self.indexfile)

221

222

if len(i) > 10000:

222

if len(i) > 10000:

223

# big index, let's parse it on demand

223

# big index, let's parse it on demand

224

parser = lazyparser(i, self)

224

parser = lazyparser(i, self)

225

self.index = lazyindex(parser)

225

self.index = lazyindex(parser)

226

self.nodemap = lazymap(parser)

226

self.nodemap = lazymap(parser)

227

else:

227

else:

228

s = struct.calcsize(indexformat)

228

s = struct.calcsize(indexformat)

229

l = len(i) / s

229

l = len(i) / s

230

self.index = [None] * l

230

self.index = [None] * l

231

m = [None] * l

231

m = [None] * l

232

233

n = 0

233

n = 0

234

for f in xrange(0, l * s, s):

234

for f in xrange(0, l * s, s):

235

# offset, size, base, linkrev, p1, p2, nodeid

235

# offset, size, base, linkrev, p1, p2, nodeid

236

e = struct.unpack(indexformat, i[f:f + s])

236

e = struct.unpack(indexformat, i[f:f + s])

237

m[n] = (e[6], n)

237

m[n] = (e[6], n)

238

self.index[n] = e

238

self.index[n] = e

239

n += 1

239

n += 1

240

241

self.nodemap = dict(m)

241

self.nodemap = dict(m)

242

self.nodemap[nullid] = -1

242

self.nodemap[nullid] = -1

243

244

def tip(self): return self.node(len(self.index) - 1)

244

def tip(self): return self.node(len(self.index) - 1)

245

def count(self): return len(self.index)

245

def count(self): return len(self.index)

246

def node(self, rev): return (rev < 0) and nullid or self.index[rev][6]

246

def node(self, rev): return (rev < 0) and nullid or self.index[rev][6]

247

def rev(self, node):

247

def rev(self, node):

248

try:

248

try:

249

return self.nodemap[node]

249

return self.nodemap[node]

250

except KeyError:

250

except KeyError:

251

raise RevlogError(_('%s: no node %s') % (self.indexfile, hex(node)))

251

raise RevlogError(_('%s: no node %s') % (self.indexfile, hex(node)))

252

def linkrev(self, node): return self.index[self.rev(node)][3]

252

def linkrev(self, node): return self.index[self.rev(node)][3]

253

def parents(self, node):

253

def parents(self, node):

254

if node == nullid: return (nullid, nullid)

254

if node == nullid: return (nullid, nullid)

255

return self.index[self.rev(node)][4:6]

255

return self.index[self.rev(node)][4:6]

256

257

def start(self, rev): return self.index[rev][0]

257

def start(self, rev): return (rev < 0) and -1 or self.index[rev][0]

258

def length(self, rev): ~~return~~ ~~self~~.~~index~~[~~rev~~][1]

258

def length(self, rev):

259

if rev < 0:

260

return 0

261

else:

262

return self.index[rev][1]

259

def end(self, rev): return self.start(rev) + self.length(rev)

263

def end(self, rev): return self.start(rev) + self.length(rev)

260

def base(self, rev): return self.index[rev][2]

264

def base(self, rev): return (rev < 0) and rev or self.index[rev][2]

261

265

262

def reachable(self, rev, stop=None):

266

def reachable(self, rev, stop=None):

263

reachable = {}

267

reachable = {}

264

visit = [rev]

268

visit = [rev]

265

reachable[rev] = 1

269

reachable[rev] = 1

266

if stop:

270

if stop:

267

stopn = self.rev(stop)

271

stopn = self.rev(stop)

268

else:

272

else:

269

stopn = 0

273

stopn = 0

270

while visit:

274

while visit:

271

n = visit.pop(0)

275

n = visit.pop(0)

272

if n == stop:

276

if n == stop:

273

continue

277

continue

274

if n == nullid:

278

if n == nullid:

275

continue

279

continue

276

for p in self.parents(n):

280

for p in self.parents(n):

277

if self.rev(p) < stopn:

281

if self.rev(p) < stopn:

278

continue

282

continue

279

if p not in reachable:

283

if p not in reachable:

280

reachable[p] = 1

284

reachable[p] = 1

281

visit.append(p)

285

visit.append(p)

282

return reachable

286

return reachable

283

287

284

def nodesbetween(self, roots=None, heads=None):

288

def nodesbetween(self, roots=None, heads=None):

285

"""Return a tuple containing three elements. Elements 1 and 2 contain

289

"""Return a tuple containing three elements. Elements 1 and 2 contain

286

a final list bases and heads after all the unreachable ones have been

290

a final list bases and heads after all the unreachable ones have been

287

pruned. Element 0 contains a topologically sorted list of all

291

pruned. Element 0 contains a topologically sorted list of all

288

292

289

nodes that satisfy these constraints:

293

nodes that satisfy these constraints:

290

1. All nodes must be descended from a node in roots (the nodes on

294

1. All nodes must be descended from a node in roots (the nodes on

291

roots are considered descended from themselves).

295

roots are considered descended from themselves).

292

2. All nodes must also be ancestors of a node in heads (the nodes in

296

2. All nodes must also be ancestors of a node in heads (the nodes in

293

heads are considered to be their own ancestors).

297

heads are considered to be their own ancestors).

294

298

295

If roots is unspecified, nullid is assumed as the only root.

299

If roots is unspecified, nullid is assumed as the only root.

296

If heads is unspecified, it is taken to be the output of the

300

If heads is unspecified, it is taken to be the output of the

297

heads method (i.e. a list of all nodes in the repository that

301

heads method (i.e. a list of all nodes in the repository that

298

have no children)."""

302

have no children)."""

299

nonodes = ([], [], [])

303

nonodes = ([], [], [])

300

if roots is not None:

304

if roots is not None:

301

roots = list(roots)

305

roots = list(roots)

302

if not roots:

306

if not roots:

303

return nonodes

307

return nonodes

304

lowestrev = min([self.rev(n) for n in roots])

308

lowestrev = min([self.rev(n) for n in roots])

305

else:

309

else:

306

roots = [nullid] # Everybody's a descendent of nullid

310

roots = [nullid] # Everybody's a descendent of nullid

307

lowestrev = -1

311

lowestrev = -1

308

if (lowestrev == -1) and (heads is None):

312

if (lowestrev == -1) and (heads is None):

309

# We want _all_ the nodes!

313

# We want _all_ the nodes!

310

return ([self.node(r) for r in xrange(0, self.count())],

314

return ([self.node(r) for r in xrange(0, self.count())],

311

[nullid], list(self.heads()))

315

[nullid], list(self.heads()))

312

if heads is None:

316

if heads is None:

313

# All nodes are ancestors, so the latest ancestor is the last

317

# All nodes are ancestors, so the latest ancestor is the last

314

# node.

318

# node.

315

highestrev = self.count() - 1

319

highestrev = self.count() - 1

316

# Set ancestors to None to signal that every node is an ancestor.

320

# Set ancestors to None to signal that every node is an ancestor.

317

ancestors = None

321

ancestors = None

318

# Set heads to an empty dictionary for later discovery of heads

322

# Set heads to an empty dictionary for later discovery of heads

319

heads = {}

323

heads = {}

320

else:

324

else:

321

heads = list(heads)

325

heads = list(heads)

322

if not heads:

326

if not heads:

323

return nonodes

327

return nonodes

324

ancestors = {}

328

ancestors = {}

325

# Start at the top and keep marking parents until we're done.

329

# Start at the top and keep marking parents until we're done.

326

nodestotag = heads[:]

330

nodestotag = heads[:]

327

# Turn heads into a dictionary so we can remove 'fake' heads.

331

# Turn heads into a dictionary so we can remove 'fake' heads.

328

# Also, later we will be using it to filter out the heads we can't

332

# Also, later we will be using it to filter out the heads we can't

329

# find from roots.

333

# find from roots.

330

heads = dict.fromkeys(heads, 0)

334

heads = dict.fromkeys(heads, 0)

331

# Remember where the top was so we can use it as a limit later.

335

# Remember where the top was so we can use it as a limit later.

332

highestrev = max([self.rev(n) for n in nodestotag])

336

highestrev = max([self.rev(n) for n in nodestotag])

333

while nodestotag:

337

while nodestotag:

334

# grab a node to tag

338

# grab a node to tag

335

n = nodestotag.pop()

339

n = nodestotag.pop()

336

# Never tag nullid

340

# Never tag nullid

337

if n == nullid:

341

if n == nullid:

338

continue

342

continue

339

# A node's revision number represents its place in a

343

# A node's revision number represents its place in a

340

# topologically sorted list of nodes.

344

# topologically sorted list of nodes.

341

r = self.rev(n)

345

r = self.rev(n)

342

if r >= lowestrev:

346

if r >= lowestrev:

343

if n not in ancestors:

347

if n not in ancestors:

344

# If we are possibly a descendent of one of the roots

348

# If we are possibly a descendent of one of the roots

345

# and we haven't already been marked as an ancestor

349

# and we haven't already been marked as an ancestor

346

ancestors[n] = 1 # Mark as ancestor

350

ancestors[n] = 1 # Mark as ancestor

347

# Add non-nullid parents to list of nodes to tag.

351

# Add non-nullid parents to list of nodes to tag.

348

nodestotag.extend([p for p in self.parents(n) if

352

nodestotag.extend([p for p in self.parents(n) if

349

p != nullid])

353

p != nullid])

350

elif n in heads: # We've seen it before, is it a fake head?

354

elif n in heads: # We've seen it before, is it a fake head?

351

# So it is, real heads should not be the ancestors of

355

# So it is, real heads should not be the ancestors of

352

# any other heads.

356

# any other heads.

353

heads.pop(n)

357

heads.pop(n)

354

if not ancestors:

358

if not ancestors:

355

return nonodes

359

return nonodes

356

# Now that we have our set of ancestors, we want to remove any

360

# Now that we have our set of ancestors, we want to remove any

357

# roots that are not ancestors.

361

# roots that are not ancestors.

358

362

359

# If one of the roots was nullid, everything is included anyway.

363

# If one of the roots was nullid, everything is included anyway.

360

if lowestrev > -1:

364

if lowestrev > -1:

361

# But, since we weren't, let's recompute the lowest rev to not

365

# But, since we weren't, let's recompute the lowest rev to not

362

# include roots that aren't ancestors.

366

# include roots that aren't ancestors.

363

367

364

# Filter out roots that aren't ancestors of heads

368

# Filter out roots that aren't ancestors of heads

365

roots = [n for n in roots if n in ancestors]

369

roots = [n for n in roots if n in ancestors]

366

# Recompute the lowest revision

370

# Recompute the lowest revision

367

if roots:

371

if roots:

368

lowestrev = min([self.rev(n) for n in roots])

372

lowestrev = min([self.rev(n) for n in roots])

369

else:

373

else:

370

# No more roots? Return empty list

374

# No more roots? Return empty list

371

return nonodes

375

return nonodes

372

else:

376

else:

373

# We are descending from nullid, and don't need to care about

377

# We are descending from nullid, and don't need to care about

374

# any other roots.

378

# any other roots.

375

lowestrev = -1

379

lowestrev = -1

376

roots = [nullid]

380

roots = [nullid]

377

# Transform our roots list into a 'set' (i.e. a dictionary where the

381

# Transform our roots list into a 'set' (i.e. a dictionary where the

378

# values don't matter.

382

# values don't matter.

379

descendents = dict.fromkeys(roots, 1)

383

descendents = dict.fromkeys(roots, 1)

380

# Also, keep the original roots so we can filter out roots that aren't

384

# Also, keep the original roots so we can filter out roots that aren't

381

# 'real' roots (i.e. are descended from other roots).

385

# 'real' roots (i.e. are descended from other roots).

382

roots = descendents.copy()

386

roots = descendents.copy()

383

# Our topologically sorted list of output nodes.

387

# Our topologically sorted list of output nodes.

384

orderedout = []

388

orderedout = []

385

# Don't start at nullid since we don't want nullid in our output list,

389

# Don't start at nullid since we don't want nullid in our output list,

386

# and if nullid shows up in descedents, empty parents will look like

390

# and if nullid shows up in descedents, empty parents will look like

387

# they're descendents.

391

# they're descendents.

388

for r in xrange(max(lowestrev, 0), highestrev + 1):

392

for r in xrange(max(lowestrev, 0), highestrev + 1):

389

n = self.node(r)

393

n = self.node(r)

390

isdescendent = False

394

isdescendent = False

391

if lowestrev == -1: # Everybody is a descendent of nullid

395

if lowestrev == -1: # Everybody is a descendent of nullid

392

isdescendent = True

396

isdescendent = True

393

elif n in descendents:

397

elif n in descendents:

394

# n is already a descendent

398

# n is already a descendent

395

isdescendent = True

399

isdescendent = True

396

# This check only needs to be done here because all the roots

400

# This check only needs to be done here because all the roots

397

# will start being marked is descendents before the loop.

401

# will start being marked is descendents before the loop.

398

if n in roots:

402

if n in roots:

399

# If n was a root, check if it's a 'real' root.

403

# If n was a root, check if it's a 'real' root.

400

p = tuple(self.parents(n))

404

p = tuple(self.parents(n))

401

# If any of its parents are descendents, it's not a root.

405

# If any of its parents are descendents, it's not a root.

402

if (p[0] in descendents) or (p[1] in descendents):

406

if (p[0] in descendents) or (p[1] in descendents):

403

roots.pop(n)

407

roots.pop(n)

404

else:

408

else:

405

p = tuple(self.parents(n))

409

p = tuple(self.parents(n))

406

# A node is a descendent if either of its parents are

410

# A node is a descendent if either of its parents are

407

# descendents. (We seeded the dependents list with the roots

411

# descendents. (We seeded the dependents list with the roots

408

# up there, remember?)

412

# up there, remember?)

409

if (p[0] in descendents) or (p[1] in descendents):

413

if (p[0] in descendents) or (p[1] in descendents):

410

descendents[n] = 1

414

descendents[n] = 1

411

isdescendent = True

415

isdescendent = True

412

if isdescendent and ((ancestors is None) or (n in ancestors)):

416

if isdescendent and ((ancestors is None) or (n in ancestors)):

413

# Only include nodes that are both descendents and ancestors.

417

# Only include nodes that are both descendents and ancestors.

414

orderedout.append(n)

418

orderedout.append(n)

415

if (ancestors is not None) and (n in heads):

419

if (ancestors is not None) and (n in heads):

416

# We're trying to figure out which heads are reachable

420

# We're trying to figure out which heads are reachable

417

# from roots.

421

# from roots.

418

# Mark this head as having been reached

422

# Mark this head as having been reached

419

heads[n] = 1

423

heads[n] = 1

420

elif ancestors is None:

424

elif ancestors is None:

421

# Otherwise, we're trying to discover the heads.

425

# Otherwise, we're trying to discover the heads.

422

# Assume this is a head because if it isn't, the next step

426

# Assume this is a head because if it isn't, the next step

423

# will eventually remove it.

427

# will eventually remove it.

424

heads[n] = 1

428

heads[n] = 1

425

# But, obviously its parents aren't.

429

# But, obviously its parents aren't.

426

for p in self.parents(n):

430

for p in self.parents(n):

427

heads.pop(p, None)

431

heads.pop(p, None)

428

heads = [n for n in heads.iterkeys() if heads[n] != 0]

432

heads = [n for n in heads.iterkeys() if heads[n] != 0]

429

roots = roots.keys()

433

roots = roots.keys()

430

assert orderedout

434

assert orderedout

431

assert roots

435

assert roots

432

assert heads

436

assert heads

433

return (orderedout, roots, heads)

437

return (orderedout, roots, heads)

434

438

435

def heads(self, start=None):

439

def heads(self, start=None):

436

"""return the list of all nodes that have no children

440

"""return the list of all nodes that have no children

437

441

438

if start is specified, only heads that are descendants of

442

if start is specified, only heads that are descendants of

439

start will be returned

443

start will be returned

440

444

441

"""

445

"""

442

if start is None:

446

if start is None:

443

start = nullid

447

start = nullid

444

reachable = {start: 1}

448

reachable = {start: 1}

445

heads = {start: 1}

449

heads = {start: 1}

446

startrev = self.rev(start)

450

startrev = self.rev(start)

447

451

448

for r in xrange(startrev + 1, self.count()):

452

for r in xrange(startrev + 1, self.count()):

449

n = self.node(r)

453

n = self.node(r)

450

for pn in self.parents(n):

454

for pn in self.parents(n):

451

if pn in reachable:

455

if pn in reachable:

452

reachable[n] = 1

456

reachable[n] = 1

453

heads[n] = 1

457

heads[n] = 1

454

if pn in heads:

458

if pn in heads:

455

del heads[pn]

459

del heads[pn]

456

return heads.keys()

460

return heads.keys()

457

461

458

def children(self, node):

462

def children(self, node):

459

"""find the children of a given node"""

463

"""find the children of a given node"""

460

c = []

464

c = []

461

p = self.rev(node)

465

p = self.rev(node)

462

for r in range(p + 1, self.count()):

466

for r in range(p + 1, self.count()):

463

n = self.node(r)

467

n = self.node(r)

464

for pn in self.parents(n):

468

for pn in self.parents(n):

465

if pn == node:

469

if pn == node:

466

c.append(n)

470

c.append(n)

467

continue

471

continue

468

elif pn == nullid:

472

elif pn == nullid:

469

continue

473

continue

470

return c

474

return c

471

475

472

def lookup(self, id):

476

def lookup(self, id):

473

"""locate a node based on revision number or subset of hex nodeid"""

477

"""locate a node based on revision number or subset of hex nodeid"""

474

try:

478

try:

475

rev = int(id)

479

rev = int(id)

476

if str(rev) != id: raise ValueError

480

if str(rev) != id: raise ValueError

477

if rev < 0: rev = self.count() + rev

481

if rev < 0: rev = self.count() + rev

478

if rev < 0 or rev >= self.count(): raise ValueError

482

if rev < 0 or rev >= self.count(): raise ValueError

479

return self.node(rev)

483

return self.node(rev)

480

except (ValueError, OverflowError):

484

except (ValueError, OverflowError):

481

c = []

485

c = []

482

for n in self.nodemap:

486

for n in self.nodemap:

483

if hex(n).startswith(id):

487

if hex(n).startswith(id):

484

c.append(n)

488

c.append(n)

485

if len(c) > 1: raise RevlogError(_("Ambiguous identifier"))

489

if len(c) > 1: raise RevlogError(_("Ambiguous identifier"))

486

if len(c) < 1: raise RevlogError(_("No match found"))

490

if len(c) < 1: raise RevlogError(_("No match found"))

487

return c[0]

491

return c[0]

488

492

489

return None

493

return None

490

494

491

def diff(self, a, b):

495

def diff(self, a, b):

492

"""return a delta between two revisions"""

496

"""return a delta between two revisions"""

493

return mdiff.textdiff(a, b)

497

return mdiff.textdiff(a, b)

494

498

495

def patches(self, t, pl):

499

def patches(self, t, pl):

496

"""apply a list of patches to a string"""

500

"""apply a list of patches to a string"""

497

return mdiff.patches(t, pl)

501

return mdiff.patches(t, pl)

498

502

499

def chunk(self, rev):

503

def chunk(self, rev):

500

start, length = self.start(rev), self.length(rev)

504

start, length = self.start(rev), self.length(rev)

501

end = start + length

505

end = start + length

502

506

503

def loadcache():

507

def loadcache():

504

cache_length = max(4096 * 1024, length) # 4Mo

508

cache_length = max(4096 * 1024, length) # 4Mo

505

df = self.opener(self.datafile)

509

df = self.opener(self.datafile)

506

df.seek(start)

510

df.seek(start)

507

self.chunkcache = (start, df.read(cache_length))

511

self.chunkcache = (start, df.read(cache_length))

508

512

509

if not self.chunkcache:

513

if not self.chunkcache:

510

loadcache()

514

loadcache()

511

515

512

cache_start = self.chunkcache[0]

516

cache_start = self.chunkcache[0]

513

cache_end = cache_start + len(self.chunkcache[1])

517

cache_end = cache_start + len(self.chunkcache[1])

514

if start >= cache_start and end <= cache_end:

518

if start >= cache_start and end <= cache_end:

515

# it is cached

519

# it is cached

516

offset = start - cache_start

520

offset = start - cache_start

517

else:

521

else:

518

loadcache()

522

loadcache()

519

offset = 0

523

offset = 0

520

524

521

#def checkchunk():

525

#def checkchunk():

522

# df = self.opener(self.datafile)

526

# df = self.opener(self.datafile)

523

# df.seek(start)

527

# df.seek(start)

524

# return df.read(length)

528

# return df.read(length)

525

#assert s == checkchunk()

529

#assert s == checkchunk()

526

return decompress(self.chunkcache[1][offset:offset + length])

530

return decompress(self.chunkcache[1][offset:offset + length])

527

531

528

def delta(self, node):

532

def delta(self, node):

529

"""return or calculate a delta between a node and its predecessor"""

533

"""return or calculate a delta between a node and its predecessor"""

530

r = self.rev(node)

534

r = self.rev(node)

531

b = self.base(r)

535

return self.revdiff(r - 1, r)

532

if r == b:

536

533

return self.diff(self.revision(self.node(r - 1)),

537

def revdiff(self, rev1, rev2):

534

self.revision(node))

538

"""return or calculate a delta between two revisions"""

539

b1 = self.base(rev1)

540

b2 = self.base(rev2)

541

if b1 == b2 and rev1 + 1 == rev2:

542

return self.chunk(rev2)

535

else:

543

else:

536

return self.~~chunk~~(r)

544

return self.diff(self.revision(self.node(rev1)),

545

self.revision(self.node(rev2)))

537

546

538

def revision(self, node):

547

def revision(self, node):

539

"""return an uncompressed revision of a given"""

548

"""return an uncompressed revision of a given"""

540

if node == nullid: return ""

549

if node == nullid: return ""

541

if self.cache and self.cache[0] == node: return self.cache[2]

550

if self.cache and self.cache[0] == node: return self.cache[2]

542

551

543

# look up what we need to read

552

# look up what we need to read

544

text = None

553

text = None

545

rev = self.rev(node)

554

rev = self.rev(node)

546

base = self.base(rev)

555

base = self.base(rev)

547

556

548

# do we have useful data cached?

557

# do we have useful data cached?

549

if self.cache and self.cache[1] >= base and self.cache[1] < rev:

558

if self.cache and self.cache[1] >= base and self.cache[1] < rev:

550

base = self.cache[1]

559

base = self.cache[1]

551

text = self.cache[2]

560

text = self.cache[2]

552

else:

561

else:

553

text = self.chunk(base)

562

text = self.chunk(base)

554

563

555

bins = []

564

bins = []

556

for r in xrange(base + 1, rev + 1):

565

for r in xrange(base + 1, rev + 1):

557

bins.append(self.chunk(r))

566

bins.append(self.chunk(r))

558

567

559

text = ~~mdif~~f.patches(text, bins)

568

text = self.patches(text, bins)

560

569

561

p1, p2 = self.parents(node)

570

p1, p2 = self.parents(node)

562

if node != hash(text, p1, p2):

571

if node != hash(text, p1, p2):

563

raise RevlogError(_("integrity check failed on %s:%d")

572

raise RevlogError(_("integrity check failed on %s:%d")

564

% (self.datafile, rev))

573

% (self.datafile, rev))

565

574

566

self.cache = (node, rev, text)

575

self.cache = (node, rev, text)

567

return text

576

return text

568

577

569

def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):

578

def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):

570

"""add a revision to the log

579

"""add a revision to the log

571

580

572

text - the revision data to add

581

text - the revision data to add

573

transaction - the transaction object used for rollback

582

transaction - the transaction object used for rollback

574

link - the linkrev data to add

583

link - the linkrev data to add

575

p1, p2 - the parent nodeids of the revision

584

p1, p2 - the parent nodeids of the revision

576

d - an optional precomputed delta

585

d - an optional precomputed delta

577

"""

586

"""

578

if text is None: text = ""

587

if text is None: text = ""

579

if p1 is None: p1 = self.tip()

588

if p1 is None: p1 = self.tip()

580

if p2 is None: p2 = nullid

589

if p2 is None: p2 = nullid

581

590

582

node = hash(text, p1, p2)

591

node = hash(text, p1, p2)

583

592

584

if node in self.nodemap:

593

if node in self.nodemap:

585

return node

594

return node

586

595

587

n = self.count()

596

n = self.count()

588

t = n - 1

597

t = n - 1

589

598

590

if n:

599

if n:

591

base = self.base(t)

600

base = self.base(t)

592

start = self.start(base)

601

start = self.start(base)

593

end = self.end(t)

602

end = self.end(t)

594

if not d:

603

if not d:

595

prev = self.revision(self.tip())

604

prev = self.revision(self.tip())

596

d = self.diff(prev, str(text))

605

d = self.diff(prev, str(text))

597

data = compress(d)

606

data = compress(d)

598

l = len(data[1]) + len(data[0])

607

l = len(data[1]) + len(data[0])

599

dist = end - start + l

608

dist = end - start + l

600

609

601

# full versions are inserted when the needed deltas

610

# full versions are inserted when the needed deltas

602

# become comparable to the uncompressed text

611

# become comparable to the uncompressed text

603

if not n or dist > len(text) * 2:

612

if not n or dist > len(text) * 2:

604

data = compress(text)

613

data = compress(text)

605

l = len(data[1]) + len(data[0])

614

l = len(data[1]) + len(data[0])

606

base = n

615

base = n

607

else:

616

else:

608

base = self.base(t)

617

base = self.base(t)

609

618

610

offset = 0

619

offset = 0

611

if t >= 0:

620

if t >= 0:

612

offset = self.end(t)

621

offset = self.end(t)

613

622

614

e = (offset, l, base, link, p1, p2, node)

623

e = (offset, l, base, link, p1, p2, node)

615

624

616

self.index.append(e)

625

self.index.append(e)

617

self.nodemap[node] = n

626

self.nodemap[node] = n

618

entry = struct.pack(indexformat, *e)

627

entry = struct.pack(indexformat, *e)

619

628

620

transaction.add(self.datafile, e[0])

629

transaction.add(self.datafile, e[0])

621

f = self.opener(self.datafile, "a")

630

f = self.opener(self.datafile, "a")

622

if data[0]:

631

if data[0]:

623

f.write(data[0])

632

f.write(data[0])

624

f.write(data[1])

633

f.write(data[1])

625

transaction.add(self.indexfile, n * len(entry))

634

transaction.add(self.indexfile, n * len(entry))

626

self.opener(self.indexfile, "a").write(entry)

635

self.opener(self.indexfile, "a").write(entry)

627

636

628

self.cache = (node, n, text)

637

self.cache = (node, n, text)

629

return node

638

return node

630

639

631

def ancestor(self, a, b):

640

def ancestor(self, a, b):

632

"""calculate the least common ancestor of nodes a and b"""

641

"""calculate the least common ancestor of nodes a and b"""

633

# calculate the distance of every node from root

642

# calculate the distance of every node from root

634

dist = {nullid: 0}

643

dist = {nullid: 0}

635

for i in xrange(self.count()):

644

for i in xrange(self.count()):

636

n = self.node(i)

645

n = self.node(i)

637

p1, p2 = self.parents(n)

646

p1, p2 = self.parents(n)

638

dist[n] = max(dist[p1], dist[p2]) + 1

647

dist[n] = max(dist[p1], dist[p2]) + 1

639

648

640

# traverse ancestors in order of decreasing distance from root

649

# traverse ancestors in order of decreasing distance from root

641

def ancestors(node):

650

def ancestors(node):

642

# we store negative distances because heap returns smallest member

651

# we store negative distances because heap returns smallest member

643

h = [(-dist[node], node)]

652

h = [(-dist[node], node)]

644

seen = {}

653

seen = {}

645

while h:

654

while h:

646

d, n = heapq.heappop(h)

655

d, n = heapq.heappop(h)

647

if n not in seen:

656

if n not in seen:

648

seen[n] = 1

657

seen[n] = 1

649

yield (-d, n)

658

yield (-d, n)

650

for p in self.parents(n):

659

for p in self.parents(n):

651

heapq.heappush(h, (-dist[p], p))

660

heapq.heappush(h, (-dist[p], p))

652

661

653

def generations(node):

662

def generations(node):

654

sg, s = None, {}

663

sg, s = None, {}

655

for g,n in ancestors(node):

664

for g,n in ancestors(node):

656

if g != sg:

665

if g != sg:

657

if sg:

666

if sg:

658

yield sg, s

667

yield sg, s

659

sg, s = g, {n:1}

668

sg, s = g, {n:1}

660

else:

669

else:

661

s[n] = 1

670

s[n] = 1

662

yield sg, s

671

yield sg, s

663

672

664

x = generations(a)

673

x = generations(a)

665

y = generations(b)

674

y = generations(b)

666

gx = x.next()

675

gx = x.next()

667

gy = y.next()

676

gy = y.next()

668

677

669

# increment each ancestor list until it is closer to root than

678

# increment each ancestor list until it is closer to root than

670

# the other, or they match

679

# the other, or they match

671

while 1:

680

while 1:

672

#print "ancestor gen %s %s" % (gx[0], gy[0])

681

#print "ancestor gen %s %s" % (gx[0], gy[0])

673

if gx[0] == gy[0]:

682

if gx[0] == gy[0]:

674

# find the intersection

683

# find the intersection

675

i = [ n for n in gx[1] if n in gy[1] ]

684

i = [ n for n in gx[1] if n in gy[1] ]

676

if i:

685

if i:

677

return i[0]

686

return i[0]

678

else:

687

else:

679

#print "next"

688

#print "next"

680

gy = y.next()

689

gy = y.next()

681

gx = x.next()

690

gx = x.next()

682

elif gx[0] < gy[0]:

691

elif gx[0] < gy[0]:

683

#print "next y"

692

#print "next y"

684

gy = y.next()

693

gy = y.next()

685

else:

694

else:

686

#print "next x"

695

#print "next x"

687

gx = x.next()

696

gx = x.next()

688

697

689

def group(self, nodelist, lookup, infocollect=None):

698

def group(self, nodelist, lookup, infocollect=None):

690

"""calculate a delta group

699

"""calculate a delta group

691

700

692

Given a list of changeset revs, return a set of deltas and

701

Given a list of changeset revs, return a set of deltas and

693

metadata corresponding to nodes. the first delta is

702

metadata corresponding to nodes. the first delta is

694

parent(nodes[0]) -> nodes[0] the receiver is guaranteed to

703

parent(nodes[0]) -> nodes[0] the receiver is guaranteed to

695

have this parent as it has all history before these

704

have this parent as it has all history before these

696

changesets. parent is parent[0]

705

changesets. parent is parent[0]

697

"""

706

"""

698

revs = [self.rev(n) for n in nodelist]

707

revs = [self.rev(n) for n in nodelist]

699

708

700

# if we don't have any revisions touched by these changesets, bail

709

# if we don't have any revisions touched by these changesets, bail

701

if not revs:

710

if not revs:

702

yield struct.pack(">l", 0)

711

yield struct.pack(">l", 0)

703

return

712

return

704

713

705

# add the parent of the first rev

714

# add the parent of the first rev

706

p = self.parents(self.node(revs[0]))[0]

715

p = self.parents(self.node(revs[0]))[0]

707

revs.insert(0, self.rev(p))

716

revs.insert(0, self.rev(p))

708

717

709

# build deltas

718

# build deltas

710

for d in xrange(0, len(revs) - 1):

719

for d in xrange(0, len(revs) - 1):

711

a, b = revs[d], revs[d + 1]

720

a, b = revs[d], revs[d + 1]

712

na = self.node(a)

713

nb = self.node(b)

721

nb = self.node(b)

714

722

715

if infocollect is not None:

723

if infocollect is not None:

716

infocollect(nb)

724

infocollect(nb)

717

725

718

# do we need to construct a new delta?

726

d = self.revdiff(a, b)

719

if a + 1 != b or self.base(b) == b:

720

ta = self.revision(na)

721

tb = self.revision(nb)

722

d = self.diff(ta, tb)

723

else:

724

d = self.chunk(b)

725

726

p = self.parents(nb)

727

p = self.parents(nb)

727

meta = nb + p[0] + p[1] + lookup(nb)

728

meta = nb + p[0] + p[1] + lookup(nb)

728

l = struct.pack(">l", len(meta) + len(d) + 4)

729

l = struct.pack(">l", len(meta) + len(d) + 4)

729

yield l

730

yield l

730

yield meta

731

yield meta

731

yield d

732

yield d

732

733

yield struct.pack(">l", 0)

734

yield struct.pack(">l", 0)

734

735

def addgroup(self, revs, linkmapper, transaction, unique=0):

736

def addgroup(self, revs, linkmapper, transaction, unique=0):

736

"""

737

"""

737

add a delta group

738

add a delta group

738

739

given a set of deltas, add them to the revision log. the

740

given a set of deltas, add them to the revision log. the

740

first delta is against its parent, which should be in our

741

first delta is against its parent, which should be in our

741

log, the rest are against the previous delta.

742

log, the rest are against the previous delta.

742

"""

743

"""

743

744

#track the base of the current delta log

745

#track the base of the current delta log

745

r = self.count()

746

r = self.count()

746

t = r - 1

747

t = r - 1

747

node = nullid

748

node = nullid

748

749

base = prev = -1

750

base = prev = -1

750

start = end = measure = 0

751

start = end = measure = 0

751

if r:

752

if r:

752

base = self.base(t)

753

base = self.base(t)

753

start = self.start(base)

754

start = self.start(base)

754

end = self.end(t)

755

end = self.end(t)

755

measure = self.length(base)

756

measure = self.length(base)

756

prev = self.tip()

757

prev = self.tip()

757

758

transaction.add(self.datafile, end)

759

transaction.add(self.datafile, end)

759

transaction.add(self.indexfile, r * struct.calcsize(indexformat))

760

transaction.add(self.indexfile, r * struct.calcsize(indexformat))

760

dfh = self.opener(self.datafile, "a")

761

dfh = self.opener(self.datafile, "a")

761

ifh = self.opener(self.indexfile, "a")

762

ifh = self.opener(self.indexfile, "a")

762

763

# loop through our set of deltas

764

# loop through our set of deltas

764

chain = None

765

chain = None

765

for chunk in revs:

766

for chunk in revs:

766

node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])

767

node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])

767

link = linkmapper(cs)

768

link = linkmapper(cs)

768

if node in self.nodemap:

769

if node in self.nodemap:

769

# this can happen if two branches make the same change

770

# this can happen if two branches make the same change

770

# if unique:

771

# if unique:

771

# raise RevlogError(_("already have %s") % hex(node[:4]))

772

# raise RevlogError(_("already have %s") % hex(node[:4]))

772

chain = node

773

chain = node

773

continue

774

continue

774

delta = chunk[80:]

775

delta = chunk[80:]

775

776

for p in (p1, p2):

777

for p in (p1, p2):

777

if not p in self.nodemap:

778

if not p in self.nodemap:

778

raise RevlogError(_("unknown parent %s") % short(p1))

779

raise RevlogError(_("unknown parent %s") % short(p1))

779

780

if not chain:

781

if not chain:

781

# retrieve the parent revision of the delta chain

782

# retrieve the parent revision of the delta chain

782

chain = p1

783

chain = p1

783

if not chain in self.nodemap:

784

if not chain in self.nodemap:

784

raise RevlogError(_("unknown base %s") % short(chain[:4]))

785

raise RevlogError(_("unknown base %s") % short(chain[:4]))

785

786

# full versions are inserted when the needed deltas become

787

# full versions are inserted when the needed deltas become

787

# comparable to the uncompressed text or when the previous

788

# comparable to the uncompressed text or when the previous

788

# version is not the one we have a delta against. We use

789

# version is not the one we have a delta against. We use

789

# the size of the previous full rev as a proxy for the

790

# the size of the previous full rev as a proxy for the

790

# current size.

791

# current size.

791

792

if chain == prev:

793

if chain == prev:

793

tempd = compress(delta)

794

tempd = compress(delta)

794

cdelta = tempd[0] + tempd[1]

795

cdelta = tempd[0] + tempd[1]

795

796

if chain != prev or (end - start + len(cdelta)) > measure * 2:

797

if chain != prev or (end - start + len(cdelta)) > measure * 2:

797

# flush our writes here so we can read it in revision

798

# flush our writes here so we can read it in revision

798

dfh.flush()

799

dfh.flush()

799

ifh.flush()

800

ifh.flush()

800

text = self.revision(chain)

801

text = self.revision(chain)

801

text = self.patches(text, [delta])

802

text = self.patches(text, [delta])

802

chk = self.addrevision(text, transaction, link, p1, p2)

803

chk = self.addrevision(text, transaction, link, p1, p2)

803

if chk != node:

804

if chk != node:

804

raise RevlogError(_("consistency error adding group"))

805

raise RevlogError(_("consistency error adding group"))

805

measure = len(text)

806

measure = len(text)

806

else:

807

else:

807

e = (end, len(cdelta), base, link, p1, p2, node)

808

e = (end, len(cdelta), base, link, p1, p2, node)

808

self.index.append(e)

809

self.index.append(e)

809

self.nodemap[node] = r

810

self.nodemap[node] = r

810

dfh.write(cdelta)

811

dfh.write(cdelta)

811

ifh.write(struct.pack(indexformat, *e))

812

ifh.write(struct.pack(indexformat, *e))

812

813

t, r, chain, prev = r, r + 1, node, node

814

t, r, chain, prev = r, r + 1, node, node

814

base = self.base(t)

815

base = self.base(t)

815

start = self.start(base)

816

start = self.start(base)

816

end = self.end(t)

817

end = self.end(t)

817

818

dfh.close()

819

dfh.close()

819

ifh.close()

820

ifh.close()

820

return node

821

return node

821

822

def strip(self, rev, minlink):

823

def strip(self, rev, minlink):

823

if self.count() == 0 or rev >= self.count():

824

if self.count() == 0 or rev >= self.count():

824

return

825

return

825

826

# When stripping away a revision, we need to make sure it

827

# When stripping away a revision, we need to make sure it

827

# does not actually belong to an older changeset.

828

# does not actually belong to an older changeset.

828

# The minlink parameter defines the oldest revision

829

# The minlink parameter defines the oldest revision

829

# we're allowed to strip away.

830

# we're allowed to strip away.

830

while minlink > self.index[rev][3]:

831

while minlink > self.index[rev][3]:

831

rev += 1

832

rev += 1

832

if rev >= self.count():

833

if rev >= self.count():

833

return

834

return

834

835

# first truncate the files on disk

836

# first truncate the files on disk

836

end = self.start(rev)

837

end = self.start(rev)

837

self.opener(self.datafile, "a").truncate(end)

838

self.opener(self.datafile, "a").truncate(end)

838

end = rev * struct.calcsize(indexformat)

839

end = rev * struct.calcsize(indexformat)

839

self.opener(self.indexfile, "a").truncate(end)

840

self.opener(self.indexfile, "a").truncate(end)

840

841

# then reset internal state in memory to forget those revisions

842

# then reset internal state in memory to forget those revisions

842

self.cache = None

843

self.cache = None

843

self.chunkcache = None

844

self.chunkcache = None

844

for p in self.index[rev:]:

845

for p in self.index[rev:]:

845

del self.nodemap[p[6]]

846

del self.nodemap[p[6]]

846

del self.index[rev:]

847

del self.index[rev:]

847

848

# truncating the lazyindex also truncates the lazymap.

849

# truncating the lazyindex also truncates the lazymap.

849

if isinstance(self.index, lazyindex):

850

if isinstance(self.index, lazyindex):

850

self.index.trunc(end)

851

self.index.trunc(end)

851

852

853

def checksize(self):

854

def checksize(self):

854

expected = 0

855

expected = 0

855

if self.count():

856

if self.count():

856

expected = self.end(self.count() - 1)

857

expected = self.end(self.count() - 1)

857

858

try:

859

try:

859

f = self.opener(self.datafile)

860

f = self.opener(self.datafile)

860

f.seek(0, 2)

861

f.seek(0, 2)

861

actual = f.tell()

862

actual = f.tell()

862

dd = actual - expected

863

dd = actual - expected

863

except IOError, inst:

864

except IOError, inst:

864

if inst.errno != errno.ENOENT:

865

if inst.errno != errno.ENOENT:

865

raise

866

raise

866

dd = 0

867

dd = 0

867

868

try:

869

try:

869

f = self.opener(self.indexfile)

870

f = self.opener(self.indexfile)

870

f.seek(0, 2)

871

f.seek(0, 2)

871

actual = f.tell()

872

actual = f.tell()

872

s = struct.calcsize(indexformat)

873

s = struct.calcsize(indexformat)

873

i = actual / s

874

i = actual / s

874

di = actual - (i * s)

875

di = actual - (i * s)

875

except IOError, inst:

876

except IOError, inst:

876

if inst.errno != errno.ENOENT:

877

if inst.errno != errno.ENOENT:

877

raise

878

raise

878

di = 0

879

di = 0

879

880

return (dd, di)

881

return (dd, di)

881

882

883

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """
             revlog.py - storage back-end for mercurial
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches
             Copyright 2005 Matt Mackall <mpm@selenic.com>
             This software may be used and distributed according to the terms
             of the GNU General Public License, incorporated herein by reference.
             """
             from node import *
             from i18n import gettext as _
             from demandload import demandload
             demandload(globals(), "binascii errno heapq mdiff os sha struct zlib")
             def hash(text, p1, p2):
                 """generate a hash from the given text and its parent hashes
                 This hash combines both the current file contents and its history
                 in a manner that makes it easy to distinguish nodes with the same
                 content in the revision graph.
                 """
                 l = [p1, p2]
                 l.sort()
                 s = sha.new(l[0])
                 s.update(l[1])
                 s.update(text)
                 return s.digest()
             def compress(text):
                 """ generate a possibly-compressed representation of text """
                 if not text: return ("", text)
                 if len(text) < 44:
                     if text[0] == '\0': return ("", text)
                     return ('u', text)
                 bin = zlib.compress(text)
                 if len(bin) > len(text):
                     if text[0] == '\0': return ("", text)
                     return ('u', text)
                 return ("", bin)
             def decompress(bin):
                 """ decompress the given input """
                 if not bin: return bin
                 t = bin[0]
                 if t == '\0': return bin
                 if t == 'x': return zlib.decompress(bin)
                 if t == 'u': return bin[1:]
                 raise RevlogError(_("unknown compression type %r") % t)
             indexformat = ">4l20s20s20s"
             class lazyparser(object):
                 """
                 this class avoids the need to parse the entirety of large indices
                 By default we parse and load 1000 entries at a time.
                 If no position is specified, we load the whole index, and replace
                 the lazy objects in revlog with the underlying objects for
                 efficiency in cases where we look at most of the nodes.
                 """
                 def __init__(self, data, revlog):
                     self.data = data
                     self.s = struct.calcsize(indexformat)
                     self.l = len(data)/self.s
                     self.index = [None] * self.l
                     self.map = {nullid: -1}
                     self.all = 0
                     self.revlog = revlog
                 def trunc(self, pos):
                     self.l = pos/self.s
                 def load(self, pos=None):
                     if self.all: return
                     if pos is not None:
                         block = pos / 1000
                         i = block * 1000
                         end = min(self.l, i + 1000)
                     else:
                         self.all = 1
                         i = 0
                         end = self.l
                         self.revlog.index = self.index
                         self.revlog.nodemap = self.map
                     while i < end:
                         d = self.data[i * self.s: (i + 1) * self.s]
                         e = struct.unpack(indexformat, d)
                         self.index[i] = e
                         self.map[e[6]] = i
                         i += 1
             class lazyindex(object):
                 """a lazy version of the index array"""
                 def __init__(self, parser):
                     self.p = parser
                 def __len__(self):
                     return len(self.p.index)
                 def load(self, pos):
                     if pos < 0:
                         pos += len(self.p.index)
                     self.p.load(pos)
                     return self.p.index[pos]
                 def __getitem__(self, pos):
                     return self.p.index[pos] or self.load(pos)
                 def __delitem__(self, pos):
                     del self.p.index[pos]
                 def append(self, e):
                     self.p.index.append(e)
                 def trunc(self, pos):
                     self.p.trunc(pos)
             class lazymap(object):
                 """a lazy version of the node map"""
                 def __init__(self, parser):
                     self.p = parser
                 def load(self, key):
                     if self.p.all: return
                     n = self.p.data.find(key)
                     if n < 0:
                         raise KeyError(key)
                     pos = n / self.p.s
                     self.p.load(pos)
                 def __contains__(self, key):
                     self.p.load()
                     return key in self.p.map
                 def __iter__(self):
                     yield nullid
                     for i in xrange(self.p.l):
                         try:
                             yield self.p.index[i][6]
                         except:
                             self.p.load(i)
                             yield self.p.index[i][6]
                 def __getitem__(self, key):
                     try:
                         return self.p.map[key]
                     except KeyError:
                         try:
                             self.load(key)
                             return self.p.map[key]
                         except KeyError:
                             raise KeyError("node " + hex(key))
                 def __setitem__(self, key, val):
                     self.p.map[key] = val
                 def __delitem__(self, key):
                     del self.p.map[key]
             class RevlogError(Exception): pass
             class revlog(object):
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, includings its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 """
                 def __init__(self, opener, indexfile, datafile):
                     """
                     create a revlog object
                     opener is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like.
                     """
                     self.indexfile = indexfile
                     self.datafile = datafile
                     self.opener = opener
                     self.indexstat = None
                     self.cache = None
                     self.chunkcache = None
                     self.load()
                 def load(self):
                     try:
                         f = self.opener(self.indexfile)
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         i = ""
                     else:
                         try:
                             st = os.fstat(f.fileno())
                         except AttributeError, inst:
                             st = None
                         else:
                             oldst = self.indexstat
                             if (oldst and st.st_dev == oldst.st_dev
                                 and st.st_ino == oldst.st_ino
                                 and st.st_mtime == oldst.st_mtime
                                 and st.st_ctime == oldst.st_ctime):
                                 return
                         self.indexstat = st
                         i = f.read()
                     if i and i[:4] != "\0\0\0\0":
                         raise RevlogError(_("incompatible revlog signature on %s") %
                                           self.indexfile)
                     if len(i) > 10000:
                         # big index, let's parse it on demand
                         parser = lazyparser(i, self)
                         self.index = lazyindex(parser)
                         self.nodemap = lazymap(parser)
                     else:
                         s = struct.calcsize(indexformat)
                         l = len(i) / s
                         self.index = [None] * l
                         m = [None] * l
                         n = 0
                         for f in xrange(0, l * s, s):
                             # offset, size, base, linkrev, p1, p2, nodeid
                             e = struct.unpack(indexformat, i[f:f + s])
                             m[n] = (e[6], n)
                             self.index[n] = e
                             n += 1
                         self.nodemap = dict(m)
                         self.nodemap[nullid] = -1
                 def tip(self): return self.node(len(self.index) - 1)
                 def count(self): return len(self.index)
                 def node(self, rev): return (rev < 0) and nullid or self.index[rev][6]
                 def rev(self, node):
                     try:
                         return self.nodemap[node]
                     except KeyError:
                         raise RevlogError(_('%s: no node %s') % (self.indexfile, hex(node)))
                 def linkrev(self, node): return self.index[self.rev(node)][3]
                 def parents(self, node):
                     if node == nullid: return (nullid, nullid)
                     return self.index[self.rev(node)][4:6]
-                def start(self, rev): return self.index[rev][0]
+                def start(self, rev): return (rev < 0) and -1 or self.index[rev][0]
-                def length(self, rev): return self.index[rev][1]
+                def length(self, rev):
+                    if rev < 0:
+                        return 0
+                    else:
+                        return self.index[rev][1]
                 def end(self, rev): return self.start(rev) + self.length(rev)
-                def base(self, rev): return self.index[rev][2]
+                def base(self, rev): return (rev < 0) and rev or self.index[rev][2]
                 def reachable(self, rev, stop=None):
                     reachable = {}
                     visit = [rev]
                     reachable[rev] = 1
                     if stop:
                         stopn = self.rev(stop)
                     else:
                         stopn = 0
                     while visit:
                         n = visit.pop(0)
                         if n == stop:
                             continue
                         if n == nullid:
                             continue
                         for p in self.parents(n):
                             if self.rev(p) < stopn:
                                 continue
                             if p not in reachable:
                                 reachable[p] = 1
                                 visit.append(p)
                     return reachable
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a tuple containing three elements. Elements 1 and 2 contain
                     a final list bases and heads after all the unreachable ones have been
                     pruned.  Element 0 contains a topologically sorted list of all
                     nodes that satisfy these constraints:
 . All nodes must be descended from a node in roots (the nodes on
                        roots are considered descended from themselves).
 . All nodes must also be ancestors of a node in heads (the nodes in
                        heads are considered to be their own ancestors).
                     If roots is unspecified, nullid is assumed as the only root.
                     If heads is unspecified, it is taken to be the output of the
                     heads method (i.e. a list of all nodes in the repository that
                     have no children)."""
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [nullid] # Everybody's a descendent of nullid
                         lowestrev = -1
                     if (lowestrev == -1) and (heads is None):
                         # We want _all_ the nodes!
                         return ([self.node(r) for r in xrange(0, self.count())],
                                 [nullid], list(self.heads()))
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = self.count() - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = {}
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = heads[:]
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, 0)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendent of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors[n] = 1 # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.extend([p for p in self.parents(n) if
                                                        p != nullid])
                                 elif n in heads: # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > -1:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [n for n in roots if n in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(n) for n in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = -1
                             roots = [nullid]
                     # Transform our roots list into a 'set' (i.e. a dictionary where the
                     # values don't matter.
                     descendents = dict.fromkeys(roots, 1)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendents.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descedents, empty parents will look like
                     # they're descendents.
                     for r in xrange(max(lowestrev, 0), highestrev + 1):
                         n = self.node(r)
                         isdescendent = False
                         if lowestrev == -1:  # Everybody is a descendent of nullid
                             isdescendent = True
                         elif n in descendents:
                             # n is already a descendent
                             isdescendent = True
                             # This check only needs to be done here because all the roots
                             # will start being marked is descendents before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendents, it's not a root.
                                 if (p[0] in descendents) or (p[1] in descendents):
                                     roots.pop(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendent if either of its parents are
                             # descendents.  (We seeded the dependents list with the roots
                             # up there, remember?)
                             if (p[0] in descendents) or (p[1] in descendents):
                                 descendents[n] = 1
                                 isdescendent = True
                         if isdescendent and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendents and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = 1
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = 1
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     heads = [n for n in heads.iterkeys() if heads[n] != 0]
                     roots = roots.keys()
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def heads(self, start=None):
                     """return the list of all nodes that have no children
                     if start is specified, only heads that are descendants of
                     start will be returned
                     """
                     if start is None:
                         start = nullid
                     reachable = {start: 1}
                     heads = {start: 1}
                     startrev = self.rev(start)
                     for r in xrange(startrev + 1, self.count()):
                         n = self.node(r)
                         for pn in self.parents(n):
                             if pn in reachable:
                                 reachable[n] = 1
                                 heads[n] = 1
                             if pn in heads:
                                 del heads[pn]
                     return heads.keys()
                 def children(self, node):
                     """find the children of a given node"""
                     c = []
                     p = self.rev(node)
                     for r in range(p + 1, self.count()):
                         n = self.node(r)
                         for pn in self.parents(n):
                             if pn == node:
                                 c.append(n)
                                 continue
                             elif pn == nullid:
                                 continue
                     return c
                 def lookup(self, id):
                     """locate a node based on revision number or subset of hex nodeid"""
                     try:
                         rev = int(id)
                         if str(rev) != id: raise ValueError
                         if rev < 0: rev = self.count() + rev
                         if rev < 0 or rev >= self.count(): raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         c = []
                         for n in self.nodemap:
                             if hex(n).startswith(id):
                                 c.append(n)
                         if len(c) > 1: raise RevlogError(_("Ambiguous identifier"))
                         if len(c) < 1: raise RevlogError(_("No match found"))
                         return c[0]
                     return None
                 def diff(self, a, b):
                     """return a delta between two revisions"""
                     return mdiff.textdiff(a, b)
                 def patches(self, t, pl):
                     """apply a list of patches to a string"""
                     return mdiff.patches(t, pl)
                 def chunk(self, rev):
                     start, length = self.start(rev), self.length(rev)
                     end = start + length
                     def loadcache():
                         cache_length = max(4096 * 1024, length) # 4Mo
                         df = self.opener(self.datafile)
                         df.seek(start)
                         self.chunkcache = (start, df.read(cache_length))
                     if not self.chunkcache:
                         loadcache()
                     cache_start = self.chunkcache[0]
                     cache_end = cache_start + len(self.chunkcache[1])
                     if start >= cache_start and end <= cache_end:
                         # it is cached
                         offset = start - cache_start
                     else:
                         loadcache()
                         offset = 0
                     #def checkchunk():
                     #    df = self.opener(self.datafile)
                     #    df.seek(start)
                     #    return df.read(length)
                     #assert s == checkchunk()
                     return decompress(self.chunkcache[1][offset:offset + length])
                 def delta(self, node):
                     """return or calculate a delta between a node and its predecessor"""
                     r = self.rev(node)
-                    b = self.base(r)
+                    return self.revdiff(r - 1, r)
-                    if r == b:
-                        return self.diff(self.revision(self.node(r - 1)),
+                def revdiff(self, rev1, rev2):
-                                         self.revision(node))
+                    """return or calculate a delta between two revisions"""
+                    b1 = self.base(rev1)
+                    b2 = self.base(rev2)
+                    if b1 == b2 and rev1 + 1 == rev2:
+                        return self.chunk(rev2)
                     else:
-                        return self.chunk(r)
+                        return self.diff(self.revision(self.node(rev1)),
+                                         self.revision(self.node(rev2)))
                 def revision(self, node):
                     """return an uncompressed revision of a given"""
                     if node == nullid: return ""
                     if self.cache and self.cache[0] == node: return self.cache[2]
                     # look up what we need to read
                     text = None
                     rev = self.rev(node)
                     base = self.base(rev)
                     # do we have useful data cached?
                     if self.cache and self.cache[1] >= base and self.cache[1] < rev:
                         base = self.cache[1]
                         text = self.cache[2]
                     else:
                         text = self.chunk(base)
                     bins = []
                     for r in xrange(base + 1, rev + 1):
                         bins.append(self.chunk(r))
-                    text = mdiff.patches(text, bins)
+                    text = self.patches(text, bins)
                     p1, p2 = self.parents(node)
                     if node != hash(text, p1, p2):
                         raise RevlogError(_("integrity check failed on %s:%d")
                                       % (self.datafile, rev))
                     self.cache = (node, rev, text)
                     return text
                 def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
                     """add a revision to the log
                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     d - an optional precomputed delta
                     """
                     if text is None: text = ""
                     if p1 is None: p1 = self.tip()
                     if p2 is None: p2 = nullid
                     node = hash(text, p1, p2)
                     if node in self.nodemap:
                         return node
                     n = self.count()
                     t = n - 1
                     if n:
                         base = self.base(t)
                         start = self.start(base)
                         end = self.end(t)
                         if not d:
                             prev = self.revision(self.tip())
                             d = self.diff(prev, str(text))
                         data = compress(d)
                         l = len(data[1]) + len(data[0])
                         dist = end - start + l
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if not n or dist > len(text) * 2:
                         data = compress(text)
                         l = len(data[1]) + len(data[0])
                         base = n
                     else:
                         base = self.base(t)
                     offset = 0
                     if t >= 0:
                         offset = self.end(t)
                     e = (offset, l, base, link, p1, p2, node)
                     self.index.append(e)
                     self.nodemap[node] = n
                     entry = struct.pack(indexformat, *e)
                     transaction.add(self.datafile, e[0])
                     f = self.opener(self.datafile, "a")
                     if data[0]:
                         f.write(data[0])
                     f.write(data[1])
                     transaction.add(self.indexfile, n * len(entry))
                     self.opener(self.indexfile, "a").write(entry)
                     self.cache = (node, n, text)
                     return node
                 def ancestor(self, a, b):
                     """calculate the least common ancestor of nodes a and b"""
                     # calculate the distance of every node from root
                     dist = {nullid: 0}
                     for i in xrange(self.count()):
                         n = self.node(i)
                         p1, p2 = self.parents(n)
                         dist[n] = max(dist[p1], dist[p2]) + 1
                     # traverse ancestors in order of decreasing distance from root
                     def ancestors(node):
                         # we store negative distances because heap returns smallest member
                         h = [(-dist[node], node)]
                         seen = {}
                         while h:
                             d, n = heapq.heappop(h)
                             if n not in seen:
                                 seen[n] = 1
                                 yield (-d, n)
                                 for p in self.parents(n):
                                     heapq.heappush(h, (-dist[p], p))
                     def generations(node):
                         sg, s = None, {}
                         for g,n in ancestors(node):
                             if g != sg:
                                 if sg:
                                     yield sg, s
                                 sg, s = g, {n:1}
                             else:
                                 s[n] = 1
                         yield sg, s
                     x = generations(a)
                     y = generations(b)
                     gx = x.next()
                     gy = y.next()
                     # increment each ancestor list until it is closer to root than
                     # the other, or they match
                     while 1:
                         #print "ancestor gen %s %s" % (gx[0], gy[0])
                         if gx[0] == gy[0]:
                             # find the intersection
                             i = [ n for n in gx[1] if n in gy[1] ]
                             if i:
                                 return i[0]
                             else:
                                 #print "next"
                                 gy = y.next()
                                 gx = x.next()
                         elif gx[0] < gy[0]:
                             #print "next y"
                             gy = y.next()
                         else:
                             #print "next x"
                             gx = x.next()
                 def group(self, nodelist, lookup, infocollect=None):
                     """calculate a delta group
                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. the first delta is
                     parent(nodes[0]) -> nodes[0] the receiver is guaranteed to
                     have this parent as it has all history before these
                     changesets. parent is parent[0]
                     """
                     revs = [self.rev(n) for n in nodelist]
                     # if we don't have any revisions touched by these changesets, bail
                     if not revs:
                         yield struct.pack(">l", 0)
                         return
                     # add the parent of the first rev
                     p = self.parents(self.node(revs[0]))[0]
                     revs.insert(0, self.rev(p))
                     # build deltas
                     for d in xrange(0, len(revs) - 1):
                         a, b = revs[d], revs[d + 1]
-                        na = self.node(a)
                         nb = self.node(b)
                         if infocollect is not None:
                             infocollect(nb)
-                        # do we need to construct a new delta?
+                        d = self.revdiff(a, b)
-                        if a + 1 != b or self.base(b) == b:
-                            ta = self.revision(na)
-                            tb = self.revision(nb)
-                            d = self.diff(ta, tb)
-                        else:
-                            d = self.chunk(b)
                         p = self.parents(nb)
                         meta = nb + p[0] + p[1] + lookup(nb)
                         l = struct.pack(">l", len(meta) + len(d) + 4)
                         yield l
                         yield meta
                         yield d
                     yield struct.pack(">l", 0)
                 def addgroup(self, revs, linkmapper, transaction, unique=0):
                     """
                     add a delta group
                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.
                     """
                     #track the base of the current delta log
                     r = self.count()
                     t = r - 1
                     node = nullid
                     base = prev = -1
                     start = end = measure = 0
                     if r:
                         base = self.base(t)
                         start = self.start(base)
                         end = self.end(t)
                         measure = self.length(base)
                         prev = self.tip()
                     transaction.add(self.datafile, end)
                     transaction.add(self.indexfile, r * struct.calcsize(indexformat))
                     dfh = self.opener(self.datafile, "a")
                     ifh = self.opener(self.indexfile, "a")
                     # loop through our set of deltas
                     chain = None
                     for chunk in revs:
                         node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
                         link = linkmapper(cs)
                         if node in self.nodemap:
                             # this can happen if two branches make the same change
                             # if unique:
                             #    raise RevlogError(_("already have %s") % hex(node[:4]))
                             chain = node
                             continue
                         delta = chunk[80:]
                         for p in (p1, p2):
                             if not p in self.nodemap:
                                 raise RevlogError(_("unknown parent %s") % short(p1))
                         if not chain:
                             # retrieve the parent revision of the delta chain
                             chain = p1
                             if not chain in self.nodemap:
                                 raise RevlogError(_("unknown base %s") % short(chain[:4]))
                         # full versions are inserted when the needed deltas become
                         # comparable to the uncompressed text or when the previous
                         # version is not the one we have a delta against. We use
                         # the size of the previous full rev as a proxy for the
                         # current size.
                         if chain == prev:
                             tempd = compress(delta)
                             cdelta = tempd[0] + tempd[1]
                         if chain != prev or (end - start + len(cdelta)) > measure * 2:
                             # flush our writes here so we can read it in revision
                             dfh.flush()
                             ifh.flush()
                             text = self.revision(chain)
                             text = self.patches(text, [delta])
                             chk = self.addrevision(text, transaction, link, p1, p2)
                             if chk != node:
                                 raise RevlogError(_("consistency error adding group"))
                             measure = len(text)
                         else:
                             e = (end, len(cdelta), base, link, p1, p2, node)
                             self.index.append(e)
                             self.nodemap[node] = r
                             dfh.write(cdelta)
                             ifh.write(struct.pack(indexformat, *e))
                         t, r, chain, prev = r, r + 1, node, node
                         base = self.base(t)
                         start = self.start(base)
                         end = self.end(t)
                     dfh.close()
                     ifh.close()
                     return node
                 def strip(self, rev, minlink):
                     if self.count() == 0 or rev >= self.count():
                         return
                     # When stripping away a revision, we need to make sure it
                     # does not actually belong to an older changeset.
                     # The minlink parameter defines the oldest revision
                     # we're allowed to strip away.
                     while minlink > self.index[rev][3]:
                         rev += 1
                         if rev >= self.count():
                             return
                     # first truncate the files on disk
                     end = self.start(rev)
                     self.opener(self.datafile, "a").truncate(end)
                     end = rev * struct.calcsize(indexformat)
                     self.opener(self.indexfile, "a").truncate(end)
                     # then reset internal state in memory to forget those revisions
                     self.cache = None
                     self.chunkcache = None
                     for p in self.index[rev:]:
                         del self.nodemap[p[6]]
                     del self.index[rev:]
                     # truncating the lazyindex also truncates the lazymap.
                     if isinstance(self.index, lazyindex):
                         self.index.trunc(end)
                 def checksize(self):
                     expected = 0
                     if self.count():
                         expected = self.end(self.count() - 1)
                     try:
                         f = self.opener(self.datafile)
                         f.seek(0, 2)
                         actual = f.tell()
                         dd = actual - expected
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         dd = 0
                     try:
                         f = self.opener(self.indexfile)
                         f.seek(0, 2)
                         actual = f.tell()
                         s = struct.calcsize(indexformat)
                         i = actual / s
                         di = actual - (i * s)
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         di = 0
                     return (dd, di)