revlog: bail out earlier in group when we have no chunks
Sune Foldager
r14523:b4175b72 default
@@ -1,1278 +1,1278 @@
# revlog.py - storage back-end for mercurial
#
# Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
#
# This software may be used and distributed according to the terms of the
# GNU General Public License version 2 or any later version.

"""Storage back-end for Mercurial.

This provides efficient delta storage with O(1) retrieve and append
and O(changes) merge between branches.
"""

# import stuff from node for others to import from revlog
from node import bin, hex, nullid, nullrev
from i18n import _
import ancestor, mdiff, parsers, error, util, dagutil
import struct, zlib, errno

_pack = struct.pack
_unpack = struct.unpack
_compress = zlib.compress
_decompress = zlib.decompress
_sha = util.sha1

# revlog header flags
REVLOGV0 = 0
REVLOGNG = 1
REVLOGNGINLINEDATA = (1 << 16)
REVLOGGENERALDELTA = (1 << 17)
REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
REVLOG_DEFAULT_FORMAT = REVLOGNG
REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGGENERALDELTA

# revlog index flags
REVIDX_KNOWN_FLAGS = 0

# max size of revlog with inline data
_maxinline = 131072
_chunksize = 1048576

RevlogError = error.RevlogError
LookupError = error.LookupError

def getoffset(q):
    return int(q >> 16)

def gettype(q):
    return int(q & 0xFFFF)

def offset_type(offset, type):
    return long(long(offset) << 16 | type)

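# Illustrative example (not in the original file): the first index field
# packs a 48-bit file offset with 16 bits of per-revision flags:
#   offset_type(10, 1) == (10 << 16) | 1 == 655361
#   getoffset(655361) == 10
#   gettype(655361) == 1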
nullhash = _sha(nullid)

def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    # As of now, if one of the parent nodes is null, p2 is null
    if p2 == nullid:
        # deep copy of a hash is faster than creating one
        s = nullhash.copy()
        s.update(p1)
    else:
        # none of the parent nodes are nullid
        l = [p1, p2]
        l.sort()
        s = _sha(l[0])
        s.update(l[1])
    s.update(text)
    return s.digest()

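# Illustrative note (not in the original file): a node id is the SHA-1 of
# the two sorted parent hashes followed by the text, so identical text
# with different history still gets a distinct node:
#   node = hash("contents\n", nullid, nullid)
#   len(node) == 20   # binary digest; hex(node) is the familiar 40 chars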
def compress(text):
    """ generate a possibly-compressed representation of text """
    if not text:
        return ("", text)
    l = len(text)
    bin = None
    if l < 44:
        pass
    elif l > 1000000:
        # zlib makes an internal copy, thus doubling memory usage for
        # large files, so let's do this in pieces
        z = zlib.compressobj()
        p = []
        pos = 0
        while pos < l:
            pos2 = pos + 2**20
            p.append(z.compress(text[pos:pos2]))
            pos = pos2
        p.append(z.flush())
        if sum(map(len, p)) < l:
            bin = "".join(p)
    else:
        bin = _compress(text)
    if bin is None or len(bin) > l:
        if text[0] == '\0':
            return ("", text)
        return ('u', text)
    return ("", bin)

def decompress(bin):
    """ decompress the given input """
    if not bin:
        return bin
    t = bin[0]
    if t == '\0':
        return bin
    if t == 'x':
        return _decompress(bin)
    if t == 'u':
        return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)

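# Illustrative example (not in the original file): the first byte of a
# stored chunk selects the decoder. zlib output always starts with 'x',
# so the compressed case needs no extra marker:
#   compress("a" * 1000) -> ("", "x\x9c...")    stored zlib-compressed
#   compress("short")    -> ("u", "short")      stored with a 'u' marker
#   decompress("ushort") == "short"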
indexformatv0 = ">4l20s20s20s"
v0shaoffset = 56

class revlogoldio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatv0)

    def parseindex(self, data, inline):
        s = self.size
        index = []
        nodemap = {nullid: nullrev}
        n = off = 0
        l = len(data)
        while off + s <= l:
            cur = data[off:off + s]
            off += s
            e = _unpack(indexformatv0, cur)
            # transform to revlogv1 format
            e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                  nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
            index.append(e2)
            nodemap[e[6]] = n
            n += 1

        # add the magic null revision at -1
        index.append((0, 0, 0, -1, -1, -1, -1, nullid))

        return index, nodemap, None

    def packentry(self, entry, node, version, rev):
        if gettype(entry[0]):
            raise RevlogError(_("index entry flags need RevlogNG"))
        e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
              node(entry[5]), node(entry[6]), entry[7])
        return _pack(indexformatv0, *e2)

# index ng:
#  6 bytes: offset
#  2 bytes: flags
#  4 bytes: compressed length
#  4 bytes: uncompressed length
#  4 bytes: base rev
#  4 bytes: link rev
#  4 bytes: parent 1 rev
#  4 bytes: parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
ngshaoffset = 32
versionformat = ">I"

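# Illustrative example (not in the original file): a RevlogNG entry is
# 64 bytes (8 + 6*4 + 20 + 12 pad) with the node id at byte 32; a v0
# entry is 76 bytes with the node at byte 56:
#   struct.calcsize(">Qiiiiii20s12x") == 64   # ngshaoffset == 32
#   struct.calcsize(">4l20s20s20s") == 76     # v0shaoffset == 56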
class revlogio(object):
    def __init__(self):
        self.size = struct.calcsize(indexformatng)

    def parseindex(self, data, inline):
        # call the C implementation to parse the index data
        index, cache = parsers.parse_index2(data, inline)
        return index, None, cache

    def packentry(self, entry, node, version, rev):
        p = _pack(indexformatng, *entry)
        if rev == 0:
            p = _pack(versionformat, version) + p[4:]
        return p

class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.
    """
    def __init__(self, opener, indexfile):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener
        self._cache = None
        self._basecache = (0, 0)
        self._chunkcache = (0, '')
        self.index = []
        self._pcache = {}
        self._nodecache = {nullid: nullrev}
        self._nodepos = None

        v = REVLOG_DEFAULT_VERSION
        if hasattr(opener, 'options'):
            if 'revlogv1' in opener.options:
                if 'generaldelta' in opener.options:
                    v |= REVLOGGENERALDELTA
            else:
                v = 0

        i = ''
        self._initempty = True
        try:
            f = self.opener(self.indexfile)
            i = f.read()
            f.close()
            if len(i) > 0:
                v = struct.unpack(versionformat, i[:4])[0]
                self._initempty = False
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise

        self.version = v
        self._inline = v & REVLOGNGINLINEDATA
        self._generaldelta = v & REVLOGGENERALDELTA
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        if fmt == REVLOGV0 and flags:
            raise RevlogError(_("index %s unknown flags %#04x for format v0")
                              % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
            raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                              % (self.indexfile, flags >> 16))
        elif fmt > REVLOGNG:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))

        self._io = revlogio()
        if self.version == REVLOGV0:
            self._io = revlogoldio()
        try:
            d = self._io.parseindex(i, self._inline)
        except (ValueError, IndexError):
            raise RevlogError(_("index %s is corrupted") % (self.indexfile))
        self.index, nodemap, self._chunkcache = d
        if nodemap is not None:
            self.nodemap = self._nodecache = nodemap
        if not self._chunkcache:
            self._chunkclear()

    def tip(self):
        return self.node(len(self.index) - 2)
    def __len__(self):
        return len(self.index) - 1
    def __iter__(self):
        for i in xrange(len(self)):
            yield i

    @util.propertycache
    def nodemap(self):
        self.rev(self.node(0))
        return self._nodecache

    def rev(self, node):
        try:
            return self._nodecache[node]
        except KeyError:
            n = self._nodecache
            i = self.index
            p = self._nodepos
            if p is None:
                p = len(i) - 2
            for r in xrange(p, -1, -1):
                v = i[r][7]
                n[v] = r
                if v == node:
                    self._nodepos = r - 1
                    return r
            raise LookupError(node, self.indexfile, _('no node'))

    def node(self, rev):
        return self.index[rev][7]
    def linkrev(self, rev):
        return self.index[rev][4]
    def parents(self, node):
        i = self.index
        d = i[self.rev(node)]
        return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
    def parentrevs(self, rev):
        return self.index[rev][5:7]
    def start(self, rev):
        return int(self.index[rev][0] >> 16)
    def end(self, rev):
        return self.start(rev) + self.length(rev)
    def length(self, rev):
        return self.index[rev][1]
    def chainbase(self, rev):
        index = self.index
        base = index[rev][3]
        while base != rev:
            rev = base
            base = index[rev][3]
        return base
    def flags(self, rev):
        return self.index[rev][0] & 0xFFFF
    def rawsize(self, rev):
        """return the length of the uncompressed text for a given revision"""
        l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.revision(self.node(rev))
        return len(t)
    size = rawsize

    def reachable(self, node, stop=None):
        """return the set of all nodes ancestral to a given node, including
        the node itself, stopping when stop is matched"""
        reachable = set((node,))
        visit = [node]
        if stop:
            stopn = self.rev(stop)
        else:
            stopn = 0
        while visit:
            n = visit.pop(0)
            if n == stop:
                continue
            if n == nullid:
                continue
            for p in self.parents(n):
                if self.rev(p) < stopn:
                    continue
                if p not in reachable:
                    reachable.add(p)
                    visit.append(p)
        return reachable

    def ancestors(self, *revs):
        """Generate the ancestors of 'revs' in reverse topological order.

        Yield a sequence of revision numbers starting with the parents
        of each revision in revs, i.e., each revision is *not* considered
        an ancestor of itself. Results are in breadth-first order:
        parents of each rev in revs, then parents of those, etc. Result
        does not include the null revision."""
        visit = list(revs)
        seen = set([nullrev])
        while visit:
            for parent in self.parentrevs(visit.pop(0)):
                if parent not in seen:
                    visit.append(parent)
                    seen.add(parent)
                    yield parent

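    # Illustrative note (not in the original file): on a linear graph
    # 0 <- 1 <- 2, ancestors() walks parents breadth-first and excludes
    # the starting revs themselves:
    #   list(rl.ancestors(2)) == [1, 0]   # 'rl' is any revlog instance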
    def descendants(self, *revs):
        """Generate the descendants of 'revs' in revision order.

        Yield a sequence of revision numbers starting with a child of
        some rev in revs, i.e., each revision is *not* considered a
        descendant of itself. Results are ordered by revision number (a
        topological sort)."""
        first = min(revs)
        if first == nullrev:
            for i in self:
                yield i
            return

        seen = set(revs)
        for i in xrange(first + 1, len(self)):
            for x in self.parentrevs(i):
                if x != nullrev and x in seen:
                    seen.add(i)
                    yield i
                    break

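    # Illustrative note (not in the original file): descendants() scans
    # forward from min(revs), relying on the revlog invariant that a
    # child's revision number is always greater than its parents':
    #   list(rl.descendants(0)) == [1, 2]   # same linear graph as above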
    def findcommonmissing(self, common=None, heads=None):
        """Return a tuple of the ancestors of common and the ancestors of heads
        that are not ancestors of common.

        More specifically, the second element is a list of nodes N such that
        every N satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        if common is None:
            common = [nullid]
        if heads is None:
            heads = self.heads()

        common = [self.rev(n) for n in common]
        heads = [self.rev(n) for n in heads]

        # we want the ancestors, but inclusive
        has = set(self.ancestors(*common))
        has.add(nullrev)
        has.update(common)

        # take all ancestors from heads that aren't in has
        missing = set()
        visit = [r for r in heads if r not in has]
        while visit:
            r = visit.pop(0)
            if r in missing:
                continue
            else:
                missing.add(r)
                for p in self.parentrevs(r):
                    if p not in has:
                        visit.append(p)
        missing = list(missing)
        missing.sort()
        return has, [self.node(r) for r in missing]

    def findmissing(self, common=None, heads=None):
        """Return the ancestors of heads that are not ancestors of common.

        More specifically, return a list of nodes N such that every N
        satisfies the following constraints:

          1. N is an ancestor of some node in 'heads'
          2. N is not an ancestor of any node in 'common'

        The list is sorted by revision number, meaning it is
        topologically sorted.

        'heads' and 'common' are both lists of node IDs. If heads is
        not supplied, uses all of the revlog's heads. If common is not
        supplied, uses nullid."""
        _common, missing = self.findcommonmissing(common, heads)
        return missing

    def nodesbetween(self, roots=None, heads=None):
        """Return a topological path from 'roots' to 'heads'.

        Return a tuple (nodes, outroots, outheads) where 'nodes' is a
        topologically sorted list of all nodes N that satisfy both of
        these constraints:

          1. N is a descendant of some node in 'roots'
          2. N is an ancestor of some node in 'heads'

        Every node is considered to be both a descendant and an ancestor
        of itself, so every reachable node in 'roots' and 'heads' will be
        included in 'nodes'.

        'outroots' is the list of reachable nodes in 'roots', i.e., the
        subset of 'roots' that is returned in 'nodes'. Likewise,
        'outheads' is the subset of 'heads' that is also in 'nodes'.

        'roots' and 'heads' are both lists of node IDs. If 'roots' is
        unspecified, uses nullid as the only root. If 'heads' is
        unspecified, uses list of all of the revlog's heads."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendent of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in self], [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = len(self) - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = set()
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, False)
            # Start at the top and keep marking parents until we're done.
            nodestotag = set(heads)
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendent of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors.add(n) # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.update([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a set.
        descendents = set(roots)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendents.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendents, empty parents will look like
        # they're descendents.
        for r in xrange(max(lowestrev, 0), highestrev + 1):
            n = self.node(r)
            isdescendent = False
            if lowestrev == nullrev: # Everybody is a descendent of nullid
                isdescendent = True
            elif n in descendents:
                # n is already a descendent
                isdescendent = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendents before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendents, it's not a root.
                    if (p[0] in descendents) or (p[1] in descendents):
                        roots.remove(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendent if either of its parents are
                # descendents. (We seeded the descendents list with the roots
                # up there, remember?)
                if (p[0] in descendents) or (p[1] in descendents):
                    descendents.add(n)
                    isdescendent = True
            if isdescendent and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendents and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = True
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = True
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n, flag in heads.iteritems() if flag]
        roots = list(roots)
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def headrevs(self):
        count = len(self)
        if not count:
            return [nullrev]
        ishead = [1] * (count + 1)
        index = self.index
        for r in xrange(count):
            e = index[r]
            ishead[e[5]] = ishead[e[6]] = 0
        return [r for r in xrange(count) if ishead[r]]

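    # Illustrative note (not in the original file): headrevs() clears the
    # flag of every rev that appears as a parent; whatever is never a
    # parent is a head. The extra list slot at index 'count' absorbs
    # nullrev (-1) parents:
    #   graph 0 <- 1 and 0 <- 2  =>  rl.headrevs() == [1, 2]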
    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None and stop is None:
            if not len(self):
                return [nullid]
            return [self.node(r) for r in self.headrevs()]

        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = set([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = set((startrev,))
        heads = set((startrev,))

        parentrevs = self.parentrevs
        for r in xrange(startrev + 1, len(self)):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable.add(r)
                    heads.add(r)
                if p in heads and p not in stoprevs:
                    heads.remove(p)

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in range(p + 1, len(self)):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def descendant(self, start, end):
        if start == nullrev:
            return True
        for i in self.descendants(start):
            if i == end:
                return True
            elif i > end:
                break
        return False

    def ancestor(self, a, b):
        """calculate the least common ancestor of nodes a and b"""

        # fast path, check if it is a descendant
        a, b = self.rev(a), self.rev(b)
        start, end = sorted((a, b))
        if self.descendant(start, end):
            return self.node(start)

        def parents(rev):
            return [p for p in self.parentrevs(rev) if p != nullrev]

        c = ancestor.ancestor(a, b, parents)
        if c is None:
            return nullid

        return self.node(c)

    def _match(self, id):
        if isinstance(id, (long, int)):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if str(rev) != id:
                raise ValueError
            if rev < 0:
                rev = len(self) + rev
            if rev < 0 or rev >= len(self):
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                self.rev(node)
                return node
            except (TypeError, LookupError):
                pass

    def _partialmatch(self, id):
        if id in self._pcache:
            return self._pcache[id]

        if len(id) < 40:
            try:
                # hex(node)[:...]
                l = len(id) // 2 # grab an even number of digits
                prefix = bin(id[:l * 2])
                nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                nl = [n for n in nl if hex(n).startswith(id)]
                if len(nl) > 0:
                    if len(nl) == 1:
                        self._pcache[id] = nl[0]
                        return nl[0]
                    raise LookupError(id, self.indexfile,
                                      _('ambiguous identifier'))
                return None
            except TypeError:
                pass

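    # Illustrative note (not in the original file): prefix lookup first
    # narrows candidates with an even-length binary prefix, then re-checks
    # the full hex string so odd-length prefixes also work:
    #   rl._partialmatch('1e4f') -> the unique node whose hex id starts
    #   with '1e4f', None if there is none, or LookupError if ambiguous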
    def lookup(self, id):
        """locate a node based on:
            - revision number or str(revision number)
            - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(id, self.indexfile, _('no match found'))

    def cmp(self, node, text):
        """compare text with a given file revision

        returns True if text is different than what is stored.
        """
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def _addchunk(self, offset, data):
        o, d = self._chunkcache
        # try to add to existing cache
        if o + len(d) == offset and len(d) + len(data) < _chunksize:
            self._chunkcache = o, d + data
        else:
            self._chunkcache = offset, data

    def _loadchunk(self, offset, length):
        if self._inline:
            df = self.opener(self.indexfile)
        else:
            df = self.opener(self.datafile)

        readahead = max(65536, length)
        df.seek(offset)
        d = df.read(readahead)
        self._addchunk(offset, d)
        if readahead > length:
            return d[:length]
        return d

    def _getchunk(self, offset, length):
        o, d = self._chunkcache
        l = len(d)

        # is it in the cache?
        cachestart = offset - o
        cacheend = cachestart + length
        if cachestart >= 0 and cacheend <= l:
            if cachestart == 0 and cacheend == l:
                return d # avoid a copy
            return d[cachestart:cacheend]

        return self._loadchunk(offset, length)

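    # Illustrative note (not in the original file): the chunk cache is a
    # single (offset, data) window. Sequential loads extend it up to
    # _chunksize, and any read inside the window is served without I/O:
    #   rl._loadchunk(0, 100)   # reads ahead (64k+ if the file allows)
    #   rl._getchunk(100, 50)   # cache hit: sliced from the same window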
    def _chunkraw(self, startrev, endrev):
        start = self.start(startrev)
        length = self.end(endrev) - start
        if self._inline:
            start += (startrev + 1) * self._io.size
        return self._getchunk(start, length)

    def _chunk(self, rev):
        return decompress(self._chunkraw(rev, rev))

    def _chunkbase(self, rev):
        return self._chunk(rev)

    def _chunkclear(self):
        self._chunkcache = (0, '')

    def deltaparent(self, rev):
        """return deltaparent of the given revision"""
        base = self.index[rev][3]
        if base == rev:
            return nullrev
        elif self._generaldelta:
            return base
        else:
            return rev - 1

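    # Illustrative note (not in the original file): how the index base
    # field maps to a delta parent:
    #   base == rev        -> full text stored, deltaparent is nullrev
    #   generaldelta off   -> deltaparent(rev) == rev - 1
    #   generaldelta on    -> deltaparent(rev) == self.index[rev][3]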
    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        if rev1 != nullrev and self.deltaparent(rev2) == rev1:
            return self._chunk(rev2)

        return mdiff.textdiff(self.revision(self.node(rev1)),
                              self.revision(self.node(rev2)))

    def revision(self, node):
        """return an uncompressed revision of a given node"""
        cachedrev = None
        if node == nullid:
            return ""
        if self._cache:
            if self._cache[0] == node:
                return self._cache[2]
            cachedrev = self._cache[1]

        # look up what we need to read
        text = None
        rev = self.rev(node)

        # check rev flags
        if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
            raise RevlogError(_('incompatible revision flag %x') %
                              (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

        # build delta chain
        chain = []
        index = self.index # for performance
        generaldelta = self._generaldelta
        iterrev = rev
        e = index[iterrev]
        while iterrev != e[3] and iterrev != cachedrev:
            chain.append(iterrev)
            if generaldelta:
                iterrev = e[3]
            else:
                iterrev -= 1
            e = index[iterrev]
        chain.reverse()
        base = iterrev

        if iterrev == cachedrev:
            # cache hit
            text = self._cache[2]

        # drop cache to save memory
        self._cache = None

        self._chunkraw(base, rev)
        if text is None:
            text = self._chunkbase(base)

        bins = [self._chunk(r) for r in chain]
        text = mdiff.patches(text, bins)

        text = self._checkhash(text, node, rev)

        self._cache = (node, rev, text)
        return text

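    # Illustrative note (not in the original file): revision() walks base
    # pointers back to a full text (or a cached rev), then replays the
    # deltas forward in one pass:
    #   chain base=5, deltas for 6,7,8 -> mdiff.patches(text5, [d6, d7, d8])
    # The single _chunkraw(base, rev) call warms the chunk cache, so each
    # _chunk(r) in the loop is served from memory.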
909 def _checkhash(self, text, node, rev):
909 def _checkhash(self, text, node, rev):
910 p1, p2 = self.parents(node)
910 p1, p2 = self.parents(node)
911 if node != hash(text, p1, p2):
911 if node != hash(text, p1, p2):
912 raise RevlogError(_("integrity check failed on %s:%d")
912 raise RevlogError(_("integrity check failed on %s:%d")
913 % (self.indexfile, rev))
913 % (self.indexfile, rev))
914 return text
914 return text
915
915
916 def checkinlinesize(self, tr, fp=None):
916 def checkinlinesize(self, tr, fp=None):
917 if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
917 if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
918 return
918 return
919
919
920 trinfo = tr.find(self.indexfile)
920 trinfo = tr.find(self.indexfile)
921 if trinfo is None:
921 if trinfo is None:
922 raise RevlogError(_("%s not found in the transaction")
922 raise RevlogError(_("%s not found in the transaction")
923 % self.indexfile)
923 % self.indexfile)
924
924
925 trindex = trinfo[2]
925 trindex = trinfo[2]
926 dataoff = self.start(trindex)
926 dataoff = self.start(trindex)
927
927
928 tr.add(self.datafile, dataoff)
928 tr.add(self.datafile, dataoff)
929
929
930 if fp:
930 if fp:
931 fp.flush()
931 fp.flush()
932 fp.close()
932 fp.close()
933
933
934 df = self.opener(self.datafile, 'w')
934 df = self.opener(self.datafile, 'w')
935 try:
935 try:
936 for r in self:
936 for r in self:
937 df.write(self._chunkraw(r, r))
937 df.write(self._chunkraw(r, r))
938 finally:
938 finally:
939 df.close()
939 df.close()
940
940
941 fp = self.opener(self.indexfile, 'w', atomictemp=True)
941 fp = self.opener(self.indexfile, 'w', atomictemp=True)
942 self.version &= ~(REVLOGNGINLINEDATA)
942 self.version &= ~(REVLOGNGINLINEDATA)
943 self._inline = False
943 self._inline = False
944 for i in self:
944 for i in self:
945 e = self._io.packentry(self.index[i], self.node, self.version, i)
945 e = self._io.packentry(self.index[i], self.node, self.version, i)
946 fp.write(e)
946 fp.write(e)
947
947
948 # if we don't call rename, the temp file will never replace the
948 # if we don't call rename, the temp file will never replace the
949 # real index
949 # real index
950 fp.rename()
950 fp.rename()
951
951
952 tr.replace(self.indexfile, trindex * self._io.size)
952 tr.replace(self.indexfile, trindex * self._io.size)
953 self._chunkclear()
953 self._chunkclear()

    def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        cachedelta - an optional precomputed delta
        """
        node = hash(text, p1, p2)
        if node in self.nodemap:
            return node

        dfh = None
        if not self._inline:
            dfh = self.opener(self.datafile, "a")
        ifh = self.opener(self.indexfile, "a+")
        try:
            return self._addrevision(node, text, transaction, link, p1, p2,
                                     cachedelta, ifh, dfh)
        finally:
            if dfh:
                dfh.close()
            ifh.close()
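
    # Usage sketch (illustrative; a revlog 'rl', an open transaction 'tr' and
    # the parent nodes are assumed):
    #
    #   node = rl.addrevision("new contents", tr, linkrev, p1node, p2node)
    #   rl.revision(node)                     # -> "new contents"
    #
    # Re-adding an identical (text, p1, p2) triple is a no-op: the node is
    # already in the nodemap and is returned without touching the files.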

    def _addrevision(self, node, text, transaction, link, p1, p2,
                     cachedelta, ifh, dfh):
        """internal function to add revisions to the log

        see addrevision for argument descriptions.
        invariants:
        - text is optional (can be None); if not set, cachedelta must be set.
          if both are set, they must correspond to each other.
        """
        btext = [text]
        def buildtext():
            if btext[0] is not None:
                return btext[0]
            # flush any pending writes here so we can read it in revision
            if dfh:
                dfh.flush()
            ifh.flush()
            basetext = self.revision(self.node(cachedelta[0]))
            btext[0] = mdiff.patch(basetext, cachedelta[1])
            chk = hash(btext[0], p1, p2)
            if chk != node:
                raise RevlogError(_("consistency error in delta"))
            return btext[0]

        def builddelta(rev):
            # can we use the cached delta?
            if cachedelta and cachedelta[0] == rev:
                delta = cachedelta[1]
            else:
                t = buildtext()
                ptext = self.revision(self.node(rev))
                delta = mdiff.textdiff(ptext, t)
            data = compress(delta)
            l = len(data[1]) + len(data[0])
            if basecache[0] == rev:
                chainbase = basecache[1]
            else:
                chainbase = self.chainbase(rev)
            dist = l + offset - self.start(chainbase)
            if self._generaldelta:
                base = rev
            else:
                base = chainbase
            return dist, l, data, base, chainbase

        curr = len(self)
        prev = curr - 1
        base = chainbase = curr
        offset = self.end(prev)
        flags = 0
        d = None
        basecache = self._basecache
        p1r, p2r = self.rev(p1), self.rev(p2)

        # should we try to build a delta?
        if prev != nullrev:
            if self._generaldelta:
                if p1r >= basecache[1]:
                    d = builddelta(p1r)
                elif p2r >= basecache[1]:
                    d = builddelta(p2r)
                else:
                    d = builddelta(prev)
            else:
                d = builddelta(prev)
            dist, l, data, base, chainbase = d

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if text is None:
            textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                        cachedelta[1])
        else:
            textlen = len(text)
        if d is None or dist > textlen * 2:
            text = buildtext()
            data = compress(text)
            l = len(data[1]) + len(data[0])
            base = chainbase = curr

        e = (offset_type(offset, flags), l, textlen,
             base, link, p1r, p2r, node)
        self.index.insert(-1, e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version, curr)
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            dfh.flush()
            ifh.write(entry)
        else:
            offset += curr * self._io.size
            transaction.add(self.indexfile, offset, curr)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self.checkinlinesize(transaction, ifh)

        if type(text) == str: # only accept immutable objects
            self._cache = (node, curr, text)
        self._basecache = (curr, chainbase)
        return node
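
    # The space/time trade-off above, restated (illustrative): a delta is
    # only stored while the bytes spanned by the whole chain stay below
    # twice the uncompressed text size; otherwise a full snapshot is written
    # and becomes the new chain base:
    #
    #   dist = l + offset - self.start(chainbase)
    #   write_fulltext = d is None or dist > textlen * 2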

    def group(self, nodelist, bundler, reorder=None):
        """Calculate a delta group, yielding a sequence of changegroup chunks
        (strings).

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes. The first delta is
        first parent(nodelist[0]) -> nodelist[0], the receiver is
        guaranteed to have this parent as it has all history before
        these changesets. If the first parent is nullrev the
        changegroup starts with a full revision.
        """

        # if we don't have any revisions touched by these changesets, bail
        if len(nodelist) == 0:
            yield bundler.close()
            return

        # for generaldelta revlogs, we linearize the revs; this will both be
        # much quicker and generate a much smaller bundle
        if (self._generaldelta and reorder is not False) or reorder:
            dag = dagutil.revlogdag(self)
            revs = set(self.rev(n) for n in nodelist)
            revs = dag.linearize(revs)
        else:
            revs = sorted([self.rev(n) for n in nodelist])

        # add the parent of the first rev
        p = self.parentrevs(revs[0])[0]
        revs.insert(0, p)

        # build deltas
        for r in xrange(len(revs) - 1):
            prev, curr = revs[r], revs[r + 1]
            for c in bundler.revchunk(self, curr, prev):
                yield c

        yield bundler.close()
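
    # Consumption sketch (illustrative; 'rl', a 'bundler' and a node list are
    # assumed): group() is a generator of changegroup chunks and, as of this
    # change, bails out before linearizing when there is nothing to send,
    # while still emitting the closing chunk:
    #
    #   for chunk in rl.group(nodes, bundler):
    #       out.write(chunk)                  # 'out' is a hypothetical sink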

    def addgroup(self, bundle, linkmapper, transaction):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log, the rest are against the previous delta.
        """

        # track the base of the current delta log
        node = None

        r = len(self)
        end = 0
        if r:
            end = self.end(r - 1)
        ifh = self.opener(self.indexfile, "a+")
        isize = r * self._io.size
        if self._inline:
            transaction.add(self.indexfile, end + isize, r)
            dfh = None
        else:
            transaction.add(self.indexfile, isize, r)
            transaction.add(self.datafile, end)
            dfh = self.opener(self.datafile, "a")

        try:
            # loop through our set of deltas
            chain = None
            while True:
                chunkdata = bundle.deltachunk(chain)
                if not chunkdata:
                    break
                node = chunkdata['node']
                p1 = chunkdata['p1']
                p2 = chunkdata['p2']
                cs = chunkdata['cs']
                deltabase = chunkdata['deltabase']
                delta = chunkdata['delta']

                link = linkmapper(cs)
                if node in self.nodemap:
                    # this can happen if two branches make the same change
                    chain = node
                    continue

                for p in (p1, p2):
                    if p not in self.nodemap:
                        raise LookupError(p, self.indexfile,
                                          _('unknown parent'))

                if deltabase not in self.nodemap:
                    raise LookupError(deltabase, self.indexfile,
                                      _('unknown delta base'))

                baserev = self.rev(deltabase)
                chain = self._addrevision(node, None, transaction, link,
                                          p1, p2, (baserev, delta), ifh, dfh)
                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    ifh.close()
                    dfh = self.opener(self.datafile, "a")
                    ifh = self.opener(self.indexfile, "a")
        finally:
            if dfh:
                dfh.close()
            ifh.close()

        return node
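
    # Receiving-side sketch (illustrative; 'bundle' wraps an incoming
    # changegroup and 'clrev' maps changeset nodes to local linkrevs):
    #
    #   tip = rl.addgroup(bundle, clrev, tr)  # returns the last node added
    #
    # Each chunk is applied through _addrevision with text=None, so fulltexts
    # are only materialized when a full snapshot has to be written.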

    def strip(self, minlink, transaction):
        """truncate the revlog on the first revision with a linkrev >= minlink

        This function is called when we're stripping revision minlink and
        its descendants from the repository.

        We have to remove all revisions with linkrev >= minlink, because
        the equivalent changelog revisions will be renumbered after the
        strip.

        So we truncate the revlog on the first of these revisions, and
        trust that the caller has saved the revisions that shouldn't be
        removed and that it'll re-add them after this truncation.
        """
        if len(self) == 0:
            return

        for rev in self:
            if self.index[rev][4] >= minlink:
                break
        else:
            return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            transaction.add(self.datafile, end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        transaction.add(self.indexfile, end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chunkclear()
        for x in xrange(rev, len(self)):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]
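
    # Example (illustrative): with stored linkrevs [0, 1, 3, 4], calling
    #
    #   rl.strip(3, tr)
    #
    # truncates at rev 2, the first revision whose linkrev is >= 3, leaving
    # revs [0, 1]; the caller re-adds whatever it wants to keep.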

    def checksize(self):
        expected = 0
        if len(self):
            expected = max(0, self.end(len(self) - 1))

        try:
            f = self.opener(self.datafile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            dd = actual - expected
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            f.close()
            s = self._io.size
            i = max(0, actual // s)
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in self:
                    databytes += max(0, self.length(r))
                dd = 0
                di = actual - len(self) * s - databytes
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)
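
    # Interpretation sketch: checksize() returns (dd, di), the differences
    # between the actual and expected sizes of the data and index files; a
    # consistent revlog yields (0, 0):
    #
    #   dd, di = rl.checksize()
    #   assert (dd, di) == (0, 0)             # otherwise the files are off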

    def files(self):
        res = [self.indexfile]
        if not self._inline:
            res.append(self.datafile)
        return res