upstream/mercurial-mirror Commit - r14219:c3342708

1

# revlog.py - storage back-end for mercurial

1

# revlog.py - storage back-end for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

"""Storage back-end for Mercurial.

8

"""Storage back-end for Mercurial.

9

10

This provides efficient delta storage with O(1) retrieve and append

10

This provides efficient delta storage with O(1) retrieve and append

11

and O(changes) merge between branches.

11

and O(changes) merge between branches.

12

"""

12

"""

13

14

# import stuff from node for others to import from revlog

14

# import stuff from node for others to import from revlog

15

from node import bin, hex, nullid, nullrev, short #@UnusedImport

15

from node import bin, hex, nullid, nullrev, short #@UnusedImport

16

from i18n import _

16

from i18n import _

17

import ancestor, mdiff, parsers, error, util

17

import ancestor, mdiff, parsers, error, util

18

import struct, zlib, errno

18

import struct, zlib, errno

19

20

_pack = struct.pack

20

_pack = struct.pack

21

_unpack = struct.unpack

21

_unpack = struct.unpack

22

_compress = zlib.compress

22

_compress = zlib.compress

23

_decompress = zlib.decompress

23

_decompress = zlib.decompress

24

_sha = util.sha1

24

_sha = util.sha1

25

26

# revlog header flags

26

# revlog header flags

27

REVLOGV0 = 0

27

REVLOGV0 = 0

28

REVLOGNG = 1

28

REVLOGNG = 1

29

REVLOGNGINLINEDATA = (1 << 16)

29

REVLOGNGINLINEDATA = (1 << 16)

30

REVLOGSHALLOW = (1 << 17)

30

REVLOGSHALLOW = (1 << 17)

31

REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA

31

REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA

32

REVLOG_DEFAULT_FORMAT = REVLOGNG

32

REVLOG_DEFAULT_FORMAT = REVLOGNG

33

REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS

33

REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS

34

REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGSHALLOW

34

REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGSHALLOW

35

36

# revlog index flags

36

# revlog index flags

37

REVIDX_KNOWN_FLAGS = 0

37

REVIDX_KNOWN_FLAGS = 0

38

39

# max size of revlog with inline data

39

# max size of revlog with inline data

40

_maxinline = 131072

40

_maxinline = 131072

41

_chunksize = 1048576

41

_chunksize = 1048576

42

43

RevlogError = error.RevlogError

43

RevlogError = error.RevlogError

44

LookupError = error.LookupError

44

LookupError = error.LookupError

45

46

def getoffset(q):

46

def getoffset(q):

47

return int(q >> 16)

47

return int(q >> 16)

48

49

def gettype(q):

49

def gettype(q):

50

return int(q & 0xFFFF)

50

return int(q & 0xFFFF)

51

52

def offset_type(offset, type):

52

def offset_type(offset, type):

53

return long(long(offset) << 16 | type)

53

return long(long(offset) << 16 | type)

54

55

nullhash = _sha(nullid)

55

nullhash = _sha(nullid)

56

57

def hash(text, p1, p2):

57

def hash(text, p1, p2):

58

"""generate a hash from the given text and its parent hashes

58

"""generate a hash from the given text and its parent hashes

59

60

This hash combines both the current file contents and its history

60

This hash combines both the current file contents and its history

61

in a manner that makes it easy to distinguish nodes with the same

61

in a manner that makes it easy to distinguish nodes with the same

62

content in the revision graph.

62

content in the revision graph.

63

"""

63

"""

64

# As of now, if one of the parent node is null, p2 is null

64

# As of now, if one of the parent node is null, p2 is null

65

if p2 == nullid:

65

if p2 == nullid:

66

# deep copy of a hash is faster than creating one

66

# deep copy of a hash is faster than creating one

67

s = nullhash.copy()

67

s = nullhash.copy()

68

s.update(p1)

68

s.update(p1)

69

else:

69

else:

70

# none of the parent nodes are nullid

70

# none of the parent nodes are nullid

71

l = [p1, p2]

71

l = [p1, p2]

72

l.sort()

72

l.sort()

73

s = _sha(l[0])

73

s = _sha(l[0])

74

s.update(l[1])

74

s.update(l[1])

75

s.update(text)

75

s.update(text)

76

return s.digest()

76

return s.digest()

77

78

def compress(text):

78

def compress(text):

79

""" generate a possibly-compressed representation of text """

79

""" generate a possibly-compressed representation of text """

80

if not text:

80

if not text:

81

return ("", text)

81

return ("", text)

82

l = len(text)

82

l = len(text)

83

bin = None

83

bin = None

84

if l < 44:

84

if l < 44:

85

pass

85

pass

86

elif l > 1000000:

86

elif l > 1000000:

87

# zlib makes an internal copy, thus doubling memory usage for

87

# zlib makes an internal copy, thus doubling memory usage for

88

# large files, so lets do this in pieces

88

# large files, so lets do this in pieces

89

z = zlib.compressobj()

89

z = zlib.compressobj()

90

p = []

90

p = []

91

pos = 0

91

pos = 0

92

while pos < l:

92

while pos < l:

93

pos2 = pos + 2**20

93

pos2 = pos + 2**20

94

p.append(z.compress(text[pos:pos2]))

94

p.append(z.compress(text[pos:pos2]))

95

pos = pos2

95

pos = pos2

96

p.append(z.flush())

96

p.append(z.flush())

97

if sum(map(len, p)) < l:

97

if sum(map(len, p)) < l:

98

bin = "".join(p)

98

bin = "".join(p)

99

else:

99

else:

100

bin = _compress(text)

100

bin = _compress(text)

101

if bin is None or len(bin) > l:

101

if bin is None or len(bin) > l:

102

if text[0] == '\0':

102

if text[0] == '\0':

103

return ("", text)

103

return ("", text)

104

return ('u', text)

104

return ('u', text)

105

return ("", bin)

105

return ("", bin)

106

107

def decompress(bin):

107

def decompress(bin):

108

""" decompress the given input """

108

""" decompress the given input """

109

if not bin:

109

if not bin:

110

return bin

110

return bin

111

t = bin[0]

111

t = bin[0]

112

if t == '\0':

112

if t == '\0':

113

return bin

113

return bin

114

if t == 'x':

114

if t == 'x':

115

return _decompress(bin)

115

return _decompress(bin)

116

if t == 'u':

116

if t == 'u':

117

return bin[1:]

117

return bin[1:]

118

raise RevlogError(_("unknown compression type %r") % t)

118

raise RevlogError(_("unknown compression type %r") % t)

119

120

indexformatv0 = ">4l20s20s20s"

120

indexformatv0 = ">4l20s20s20s"

121

v0shaoffset = 56

121

v0shaoffset = 56

122

123

class revlogoldio(object):

123

class revlogoldio(object):

124

def __init__(self):

124

def __init__(self):

125

self.size = struct.calcsize(indexformatv0)

125

self.size = struct.calcsize(indexformatv0)

126

127

def parseindex(self, data, inline):

127

def parseindex(self, data, inline):

128

s = self.size

128

s = self.size

129

index = []

129

index = []

130

nodemap = {nullid: nullrev}

130

nodemap = {nullid: nullrev}

131

n = off = 0

131

n = off = 0

132

l = len(data)

132

l = len(data)

133

while off + s <= l:

133

while off + s <= l:

134

cur = data[off:off + s]

134

cur = data[off:off + s]

135

off += s

135

off += s

136

e = _unpack(indexformatv0, cur)

136

e = _unpack(indexformatv0, cur)

137

# transform to revlogv1 format

137

# transform to revlogv1 format

138

e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],

138

e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],

139

nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])

139

nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])

140

index.append(e2)

140

index.append(e2)

141

nodemap[e[6]] = n

141

nodemap[e[6]] = n

142

n += 1

142

n += 1

143

144

# add the magic null revision at -1

144

# add the magic null revision at -1

145

index.append((0, 0, 0, -1, -1, -1, -1, nullid))

145

index.append((0, 0, 0, -1, -1, -1, -1, nullid))

146

147

return index, nodemap, None

147

return index, nodemap, None

148

149

def packentry(self, entry, node, version, rev):

149

def packentry(self, entry, node, version, rev):

150

if gettype(entry[0]):

150

if gettype(entry[0]):

151

raise RevlogError(_("index entry flags need RevlogNG"))

151

raise RevlogError(_("index entry flags need RevlogNG"))

152

e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],

152

e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],

153

node(entry[5]), node(entry[6]), entry[7])

153

node(entry[5]), node(entry[6]), entry[7])

154

return _pack(indexformatv0, *e2)

154

return _pack(indexformatv0, *e2)

155

156

# index ng:

156

# index ng:

157

# 6 bytes: offset

157

# 6 bytes: offset

158

# 2 bytes: flags

158

# 2 bytes: flags

159

# 4 bytes: compressed length

159

# 4 bytes: compressed length

160

# 4 bytes: uncompressed length

160

# 4 bytes: uncompressed length

161

# 4 bytes: base rev

161

# 4 bytes: base rev

162

# 4 bytes: link rev

162

# 4 bytes: link rev

163

# 4 bytes: parent 1 rev

163

# 4 bytes: parent 1 rev

164

# 4 bytes: parent 2 rev

164

# 4 bytes: parent 2 rev

165

# 32 bytes: nodeid

165

# 32 bytes: nodeid

166

indexformatng = ">Qiiiiii20s12x"

166

indexformatng = ">Qiiiiii20s12x"

167

ngshaoffset = 32

167

ngshaoffset = 32

168

versionformat = ">I"

168

versionformat = ">I"

169

170

class revlogio(object):

170

class revlogio(object):

171

def __init__(self):

171

def __init__(self):

172

self.size = struct.calcsize(indexformatng)

172

self.size = struct.calcsize(indexformatng)

173

174

def parseindex(self, data, inline):

174

def parseindex(self, data, inline):

175

# call the C implementation to parse the index data

175

# call the C implementation to parse the index data

176

index, cache = parsers.parse_index2(data, inline)

176

index, cache = parsers.parse_index2(data, inline)

177

return index, None, cache

177

return index, None, cache

178

179

def packentry(self, entry, node, version, rev):

179

def packentry(self, entry, node, version, rev):

180

p = _pack(indexformatng, *entry)

180

p = _pack(indexformatng, *entry)

181

if rev == 0:

181

if rev == 0:

182

p = _pack(versionformat, version) + p[4:]

182

p = _pack(versionformat, version) + p[4:]

183

return p

183

return p

184

185

class revlog(object):

185

class revlog(object):

186

"""

186

"""

187

the underlying revision storage object

187

the underlying revision storage object

188

189

A revlog consists of two parts, an index and the revision data.

189

A revlog consists of two parts, an index and the revision data.

190

191

The index is a file with a fixed record size containing

191

The index is a file with a fixed record size containing

192

information on each revision, including its nodeid (hash), the

192

information on each revision, including its nodeid (hash), the

193

nodeids of its parents, the position and offset of its data within

193

nodeids of its parents, the position and offset of its data within

194

the data file, and the revision it's based on. Finally, each entry

194

the data file, and the revision it's based on. Finally, each entry

195

contains a linkrev entry that can serve as a pointer to external

195

contains a linkrev entry that can serve as a pointer to external

196

data.

196

data.

197

198

The revision data itself is a linear collection of data chunks.

198

The revision data itself is a linear collection of data chunks.

199

Each chunk represents a revision and is usually represented as a

199

Each chunk represents a revision and is usually represented as a

200

delta against the previous chunk. To bound lookup time, runs of

200

delta against the previous chunk. To bound lookup time, runs of

201

deltas are limited to about 2 times the length of the original

201

deltas are limited to about 2 times the length of the original

202

version data. This makes retrieval of a version proportional to

202

version data. This makes retrieval of a version proportional to

203

its size, or O(1) relative to the number of revisions.

203

its size, or O(1) relative to the number of revisions.

204

205

Both pieces of the revlog are written to in an append-only

205

Both pieces of the revlog are written to in an append-only

206

fashion, which means we never need to rewrite a file to insert or

206

fashion, which means we never need to rewrite a file to insert or

207

remove data, and can use some simple techniques to avoid the need

207

remove data, and can use some simple techniques to avoid the need

208

for locking while reading.

208

for locking while reading.

209

"""

209

"""

210

def __init__(self, opener, indexfile, shallowroot=None):

210

def __init__(self, opener, indexfile, shallowroot=None):

211

"""

211

"""

212

create a revlog object

212

create a revlog object

213

214

opener is a function that abstracts the file opening operation

214

opener is a function that abstracts the file opening operation

215

and can be used to implement COW semantics or the like.

215

and can be used to implement COW semantics or the like.

216

"""

216

"""

217

self.indexfile = indexfile

217

self.indexfile = indexfile

218

self.datafile = indexfile[:-2] + ".d"

218

self.datafile = indexfile[:-2] + ".d"

219

self.opener = opener

219

self.opener = opener

220

self._cache = None

220

self._cache = None

221

self._chunkcache = (0, '')

221

self._chunkcache = (0, '')

222

self.index = []

222

self.index = []

223

self._shallowroot = shallowroot

223

self._shallowroot = shallowroot

224

self._pcache = {}

224

self._pcache = {}

225

self._nodecache = {nullid: nullrev}

225

self._nodecache = {nullid: nullrev}

226

self._nodepos = None

226

self._nodepos = None

227

228

v = REVLOG_DEFAULT_VERSION

228

v = REVLOG_DEFAULT_VERSION

229

if hasattr(opener, 'options') and 'defversion' in opener.options:

229

if hasattr(opener, 'options') and 'defversion' in opener.options:

230

v = opener.options['defversion']

230

v = opener.options['defversion']

231

if v & REVLOGNG:

231

if v & REVLOGNG:

232

v |= REVLOGNGINLINEDATA

232

v |= REVLOGNGINLINEDATA

233

234

if shallowroot:

234

if shallowroot:

235

v |= REVLOGSHALLOW

235

v |= REVLOGSHALLOW

236

237

i = ''

237

i = ''

238

try:

238

try:

239

f = self.opener(self.indexfile)

239

f = self.opener(self.indexfile)

240

i = f.read()

240

i = f.read()

241

f.close()

241

f.close()

242

if len(i) > 0:

242

if len(i) > 0:

243

v = struct.unpack(versionformat, i[:4])[0]

243

v = struct.unpack(versionformat, i[:4])[0]

244

except IOError, inst:

244

except IOError, inst:

245

if inst.errno != errno.ENOENT:

245

if inst.errno != errno.ENOENT:

246

raise

246

raise

247

248

self.version = v

248

self.version = v

249

self._inline = v & REVLOGNGINLINEDATA

249

self._inline = v & REVLOGNGINLINEDATA

250

self._shallow = v & REVLOGSHALLOW

250

self._shallow = v & REVLOGSHALLOW

251

flags = v & ~0xFFFF

251

flags = v & ~0xFFFF

252

fmt = v & 0xFFFF

252

fmt = v & 0xFFFF

253

if fmt == REVLOGV0 and flags:

253

if fmt == REVLOGV0 and flags:

254

raise RevlogError(_("index %s unknown flags %#04x for format v0")

254

raise RevlogError(_("index %s unknown flags %#04x for format v0")

255

% (self.indexfile, flags >> 16))

255

% (self.indexfile, flags >> 16))

256

elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:

256

elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:

257

raise RevlogError(_("index %s unknown flags %#04x for revlogng")

257

raise RevlogError(_("index %s unknown flags %#04x for revlogng")

258

% (self.indexfile, flags >> 16))

258

% (self.indexfile, flags >> 16))

259

elif fmt > REVLOGNG:

259

elif fmt > REVLOGNG:

260

raise RevlogError(_("index %s unknown format %d")

260

raise RevlogError(_("index %s unknown format %d")

261

% (self.indexfile, fmt))

261

% (self.indexfile, fmt))

262

263

self._io = revlogio()

263

self._io = revlogio()

264

if self.version == REVLOGV0:

264

if self.version == REVLOGV0:

265

self._io = revlogoldio()

265

self._io = revlogoldio()

266

try:

266

try:

267

d = self._io.parseindex(i, self._inline)

267

d = self._io.parseindex(i, self._inline)

268

except (ValueError, IndexError):

268

except (ValueError, IndexError):

269

raise RevlogError(_("index %s is corrupted") % (self.indexfile))

269

raise RevlogError(_("index %s is corrupted") % (self.indexfile))

270

self.index, nodemap, self._chunkcache = d

270

self.index, nodemap, self._chunkcache = d

271

if nodemap is not None:

271

if nodemap is not None:

272

self.nodemap = self._nodecache = nodemap

272

self.nodemap = self._nodecache = nodemap

273

if not self._chunkcache:

273

if not self._chunkcache:

274

self._chunkclear()

274

self._chunkclear()

275

276

def tip(self):

276

def tip(self):

277

return self.node(len(self.index) - 2)

277

return self.node(len(self.index) - 2)

278

def __len__(self):

278

def __len__(self):

279

return len(self.index) - 1

279

return len(self.index) - 1

280

def __iter__(self):

280

def __iter__(self):

281

for i in xrange(len(self)):

281

for i in xrange(len(self)):

282

yield i

282

yield i

283

284

@util.propertycache

284

@util.propertycache

285

def nodemap(self):

285

def nodemap(self):

286

self.rev(self.node(0))

286

self.rev(self.node(0))

287

return self._nodecache

287

return self._nodecache

288

289

def rev(self, node):

289

def rev(self, node):

290

try:

290

try:

291

return self._nodecache[node]

291

return self._nodecache[node]

292

except KeyError:

292

except KeyError:

293

n = self._nodecache

293

n = self._nodecache

294

i = self.index

294

i = self.index

295

p = self._nodepos

295

p = self._nodepos

296

if p is None:

296

if p is None:

297

p = len(i) - 2

297

p = len(i) - 2

298

for r in xrange(p, -1, -1):

298

for r in xrange(p, -1, -1):

299

v = i[r][7]

299

v = i[r][7]

300

n[v] = r

300

n[v] = r

301

if v == node:

301

if v == node:

302

self._nodepos = r - 1

302

self._nodepos = r - 1

303

return r

303

return r

304

raise LookupError(node, self.indexfile, _('no node'))

304

raise LookupError(node, self.indexfile, _('no node'))

305

306

def node(self, rev):

306

def node(self, rev):

307

return self.index[rev][7]

307

return self.index[rev][7]

308

def linkrev(self, rev):

308

def linkrev(self, rev):

309

return self.index[rev][4]

309

return self.index[rev][4]

310

def parents(self, node):

310

def parents(self, node):

311

i = self.index

311

i = self.index

312

d = i[self.rev(node)]

312

d = i[self.rev(node)]

313

return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline

313

return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline

314

def parentrevs(self, rev):

314

def parentrevs(self, rev):

315

return self.index[rev][5:7]

315

return self.index[rev][5:7]

316

def start(self, rev):

316

def start(self, rev):

317

return int(self.index[rev][0] >> 16)

317

return int(self.index[rev][0] >> 16)

318

def end(self, rev):

318

def end(self, rev):

319

return self.start(rev) + self.length(rev)

319

return self.start(rev) + self.length(rev)

320

def length(self, rev):

320

def length(self, rev):

321

return self.index[rev][1]

321

return self.index[rev][1]

322

def base(self, rev):

322

def base(self, rev):

323

return self.index[rev][3]

323

return self.index[rev][3]

324

def flags(self, rev):

324

def flags(self, rev):

325

return self.index[rev][0] & 0xFFFF

325

return self.index[rev][0] & 0xFFFF

326

def rawsize(self, rev):

326

def rawsize(self, rev):

327

"""return the length of the uncompressed text for a given revision"""

327

"""return the length of the uncompressed text for a given revision"""

328

l = self.index[rev][2]

328

l = self.index[rev][2]

329

if l >= 0:

329

if l >= 0:

330

return l

330

return l

331

332

t = self.revision(self.node(rev))

332

t = self.revision(self.node(rev))

333

return len(t)

333

return len(t)

334

size = rawsize

334

size = rawsize

335

336

def reachable(self, node, stop=None):

336

def reachable(self, node, stop=None):

337

"""return the set of all nodes ancestral to a given node, including

337

"""return the set of all nodes ancestral to a given node, including

338

the node itself, stopping when stop is matched"""

338

the node itself, stopping when stop is matched"""

339

reachable = set((node,))

339

reachable = set((node,))

340

visit = [node]

340

visit = [node]

341

if stop:

341

if stop:

342

stopn = self.rev(stop)

342

stopn = self.rev(stop)

343

else:

343

else:

344

stopn = 0

344

stopn = 0

345

while visit:

345

while visit:

346

n = visit.pop(0)

346

n = visit.pop(0)

347

if n == stop:

347

if n == stop:

348

continue

348

continue

349

if n == nullid:

349

if n == nullid:

350

continue

350

continue

351

for p in self.parents(n):

351

for p in self.parents(n):

352

if self.rev(p) < stopn:

352

if self.rev(p) < stopn:

353

continue

353

continue

354

if p not in reachable:

354

if p not in reachable:

355

reachable.add(p)

355

reachable.add(p)

356

visit.append(p)

356

visit.append(p)

357

return reachable

357

return reachable

358

359

def ancestors(self, *revs):

359

def ancestors(self, *revs):

360

"""Generate the ancestors of 'revs' in reverse topological order.

360

"""Generate the ancestors of 'revs' in reverse topological order.

361

362

Yield a sequence of revision numbers starting with the parents

362

Yield a sequence of revision numbers starting with the parents

363

of each revision in revs, i.e., each revision is *not* considered

363

of each revision in revs, i.e., each revision is *not* considered

364

an ancestor of itself. Results are in breadth-first order:

364

an ancestor of itself. Results are in breadth-first order:

365

parents of each rev in revs, then parents of those, etc. Result

365

parents of each rev in revs, then parents of those, etc. Result

366

does not include the null revision."""

366

does not include the null revision."""

367

visit = list(revs)

367

visit = list(revs)

368

seen = set([nullrev])

368

seen = set([nullrev])

369

while visit:

369

while visit:

370

for parent in self.parentrevs(visit.pop(0)):

370

for parent in self.parentrevs(visit.pop(0)):

371

if parent not in seen:

371

if parent not in seen:

372

visit.append(parent)

372

visit.append(parent)

373

seen.add(parent)

373

seen.add(parent)

374

yield parent

374

yield parent

375

376

def descendants(self, *revs):

376

def descendants(self, *revs):

377

"""Generate the descendants of 'revs' in revision order.

377

"""Generate the descendants of 'revs' in revision order.

378

379

Yield a sequence of revision numbers starting with a child of

379

Yield a sequence of revision numbers starting with a child of

380

some rev in revs, i.e., each revision is *not* considered a

380

some rev in revs, i.e., each revision is *not* considered a

381

descendant of itself. Results are ordered by revision number (a

381

descendant of itself. Results are ordered by revision number (a

382

topological sort)."""

382

topological sort)."""

383

first = min(revs)

383

first = min(revs)

384

if first == nullrev:

384

if first == nullrev:

385

for i in self:

385

for i in self:

386

yield i

386

yield i

387

return

387

return

388

389

seen = set(revs)

389

seen = set(revs)

390

for i in xrange(first + 1, len(self)):

390

for i in xrange(first + 1, len(self)):

391

for x in self.parentrevs(i):

391

for x in self.parentrevs(i):

392

if x != nullrev and x in seen:

392

if x != nullrev and x in seen:

393

seen.add(i)

393

seen.add(i)

394

yield i

394

yield i

395

break

395

break

396

397

def findcommonmissing(self, common=None, heads=None):

397

def findcommonmissing(self, common=None, heads=None):

398

"""Return a tuple of the ancestors of common and the ancestors of heads

398

"""Return a tuple of the ancestors of common and the ancestors of heads

399

that are not ancestors of common.

399

that are not ancestors of common.

400

401

More specifically, the second element is a list of nodes N such that

401

More specifically, the second element is a list of nodes N such that

402

every N satisfies the following constraints:

402

every N satisfies the following constraints:

403

404

1. N is an ancestor of some node in 'heads'

404

1. N is an ancestor of some node in 'heads'

405

2. N is not an ancestor of any node in 'common'

405

2. N is not an ancestor of any node in 'common'

406

407

The list is sorted by revision number, meaning it is

407

The list is sorted by revision number, meaning it is

408

topologically sorted.

408

topologically sorted.

409

410

'heads' and 'common' are both lists of node IDs. If heads is

410

'heads' and 'common' are both lists of node IDs. If heads is

411

not supplied, uses all of the revlog's heads. If common is not

411

not supplied, uses all of the revlog's heads. If common is not

412

supplied, uses nullid."""

412

supplied, uses nullid."""

413

if common is None:

413

if common is None:

414

common = [nullid]

414

common = [nullid]

415

if heads is None:

415

if heads is None:

416

heads = self.heads()

416

heads = self.heads()

417

418

common = [self.rev(n) for n in common]

418

common = [self.rev(n) for n in common]

419

heads = [self.rev(n) for n in heads]

419

heads = [self.rev(n) for n in heads]

420

421

# we want the ancestors, but inclusive

421

# we want the ancestors, but inclusive

422

has = set(self.ancestors(*common))

422

has = set(self.ancestors(*common))

423

has.add(nullrev)

423

has.add(nullrev)

424

has.update(common)

424

has.update(common)

425

426

# take all ancestors from heads that aren't in has

426

# take all ancestors from heads that aren't in has

427

missing = set()

427

missing = set()

428

visit = [r for r in heads if r not in has]

428

visit = [r for r in heads if r not in has]

429

while visit:

429

while visit:

430

r = visit.pop(0)

430

r = visit.pop(0)

431

if r in missing:

431

if r in missing:

432

continue

432

continue

433

else:

433

else:

434

missing.add(r)

434

missing.add(r)

435

for p in self.parentrevs(r):

435

for p in self.parentrevs(r):

436

if p not in has:

436

if p not in has:

437

visit.append(p)

437

visit.append(p)

438

missing = list(missing)

438

missing = list(missing)

439

missing.sort()

439

missing.sort()

440

return has, [self.node(r) for r in missing]

440

return has, [self.node(r) for r in missing]

441

442

def findmissing(self, common=None, heads=None):

442

def findmissing(self, common=None, heads=None):

443

"""Return the ancestors of heads that are not ancestors of common.

443

"""Return the ancestors of heads that are not ancestors of common.

444

445

More specifically, return a list of nodes N such that every N

445

More specifically, return a list of nodes N such that every N

446

satisfies the following constraints:

446

satisfies the following constraints:

447

448

1. N is an ancestor of some node in 'heads'

448

1. N is an ancestor of some node in 'heads'

449

2. N is not an ancestor of any node in 'common'

449

2. N is not an ancestor of any node in 'common'

450

451

The list is sorted by revision number, meaning it is

451

The list is sorted by revision number, meaning it is

452

topologically sorted.

452

topologically sorted.

453

454

'heads' and 'common' are both lists of node IDs. If heads is

454

'heads' and 'common' are both lists of node IDs. If heads is

455

not supplied, uses all of the revlog's heads. If common is not

455

not supplied, uses all of the revlog's heads. If common is not

456

supplied, uses nullid."""

456

supplied, uses nullid."""

457

_common, missing = self.findcommonmissing(common, heads)

457

_common, missing = self.findcommonmissing(common, heads)

458

return missing

458

return missing

459

460

def nodesbetween(self, roots=None, heads=None):

460

def nodesbetween(self, roots=None, heads=None):

461

"""Return a topological path from 'roots' to 'heads'.

461

"""Return a topological path from 'roots' to 'heads'.

462

463

Return a tuple (nodes, outroots, outheads) where 'nodes' is a

463

Return a tuple (nodes, outroots, outheads) where 'nodes' is a

464

topologically sorted list of all nodes N that satisfy both of

464

topologically sorted list of all nodes N that satisfy both of

465

these constraints:

465

these constraints:

466

467

1. N is a descendant of some node in 'roots'

467

1. N is a descendant of some node in 'roots'

468

2. N is an ancestor of some node in 'heads'

468

2. N is an ancestor of some node in 'heads'

469

470

Every node is considered to be both a descendant and an ancestor

470

Every node is considered to be both a descendant and an ancestor

471

of itself, so every reachable node in 'roots' and 'heads' will be

471

of itself, so every reachable node in 'roots' and 'heads' will be

472

included in 'nodes'.

472

included in 'nodes'.

473

474

'outroots' is the list of reachable nodes in 'roots', i.e., the

474

'outroots' is the list of reachable nodes in 'roots', i.e., the

475

subset of 'roots' that is returned in 'nodes'. Likewise,

475

subset of 'roots' that is returned in 'nodes'. Likewise,

476

'outheads' is the subset of 'heads' that is also in 'nodes'.

476

'outheads' is the subset of 'heads' that is also in 'nodes'.

477

478

'roots' and 'heads' are both lists of node IDs. If 'roots' is

478

'roots' and 'heads' are both lists of node IDs. If 'roots' is

479

unspecified, uses nullid as the only root. If 'heads' is

479

unspecified, uses nullid as the only root. If 'heads' is

480

unspecified, uses list of all of the revlog's heads."""

480

unspecified, uses list of all of the revlog's heads."""

481

nonodes = ([], [], [])

481

nonodes = ([], [], [])

482

if roots is not None:

482

if roots is not None:

483

roots = list(roots)

483

roots = list(roots)

484

if not roots:

484

if not roots:

485

return nonodes

485

return nonodes

486

lowestrev = min([self.rev(n) for n in roots])

486

lowestrev = min([self.rev(n) for n in roots])

487

else:

487

else:

488

roots = [nullid] # Everybody's a descendent of nullid

488

roots = [nullid] # Everybody's a descendent of nullid

489

lowestrev = nullrev

489

lowestrev = nullrev

490

if (lowestrev == nullrev) and (heads is None):

490

if (lowestrev == nullrev) and (heads is None):

491

# We want _all_ the nodes!

491

# We want _all_ the nodes!

492

return ([self.node(r) for r in self], [nullid], list(self.heads()))

492

return ([self.node(r) for r in self], [nullid], list(self.heads()))

493

if heads is None:

493

if heads is None:

494

# All nodes are ancestors, so the latest ancestor is the last

494

# All nodes are ancestors, so the latest ancestor is the last

495

# node.

495

# node.

496

highestrev = len(self) - 1

496

highestrev = len(self) - 1

497

# Set ancestors to None to signal that every node is an ancestor.

497

# Set ancestors to None to signal that every node is an ancestor.

498

ancestors = None

498

ancestors = None

499

# Set heads to an empty dictionary for later discovery of heads

499

# Set heads to an empty dictionary for later discovery of heads

500

heads = {}

500

heads = {}

501

else:

501

else:

502

heads = list(heads)

502

heads = list(heads)

503

if not heads:

503

if not heads:

504

return nonodes

504

return nonodes

505

ancestors = set()

505

ancestors = set()

506

# Turn heads into a dictionary so we can remove 'fake' heads.

506

# Turn heads into a dictionary so we can remove 'fake' heads.

507

# Also, later we will be using it to filter out the heads we can't

507

# Also, later we will be using it to filter out the heads we can't

508

# find from roots.

508

# find from roots.

509

heads = dict.fromkeys(heads, 0)

509

heads = dict.fromkeys(heads, False)

510

# Start at the top and keep marking parents until we're done.

510

# Start at the top and keep marking parents until we're done.

511

nodestotag = set(heads)

511

nodestotag = set(heads)

512

# Remember where the top was so we can use it as a limit later.

512

# Remember where the top was so we can use it as a limit later.

513

highestrev = max([self.rev(n) for n in nodestotag])

513

highestrev = max([self.rev(n) for n in nodestotag])

514

while nodestotag:

514

while nodestotag:

515

# grab a node to tag

515

# grab a node to tag

516

n = nodestotag.pop()

516

n = nodestotag.pop()

517

# Never tag nullid

517

# Never tag nullid

518

if n == nullid:

518

if n == nullid:

519

continue

519

continue

520

# A node's revision number represents its place in a

520

# A node's revision number represents its place in a

521

# topologically sorted list of nodes.

521

# topologically sorted list of nodes.

522

r = self.rev(n)

522

r = self.rev(n)

523

if r >= lowestrev:

523

if r >= lowestrev:

524

if n not in ancestors:

524

if n not in ancestors:

525

# If we are possibly a descendent of one of the roots

525

# If we are possibly a descendent of one of the roots

526

# and we haven't already been marked as an ancestor

526

# and we haven't already been marked as an ancestor

527

ancestors.add(n) # Mark as ancestor

527

ancestors.add(n) # Mark as ancestor

528

# Add non-nullid parents to list of nodes to tag.

528

# Add non-nullid parents to list of nodes to tag.

529

nodestotag.update([p for p in self.parents(n) if

529

nodestotag.update([p for p in self.parents(n) if

530

p != nullid])

530

p != nullid])

531

elif n in heads: # We've seen it before, is it a fake head?

531

elif n in heads: # We've seen it before, is it a fake head?

532

# So it is, real heads should not be the ancestors of

532

# So it is, real heads should not be the ancestors of

533

# any other heads.

533

# any other heads.

534

heads.pop(n)

534

heads.pop(n)

535

if not ancestors:

535

if not ancestors:

536

return nonodes

536

return nonodes

537

# Now that we have our set of ancestors, we want to remove any

537

# Now that we have our set of ancestors, we want to remove any

538

# roots that are not ancestors.

538

# roots that are not ancestors.

539

540

# If one of the roots was nullid, everything is included anyway.

540

# If one of the roots was nullid, everything is included anyway.

541

if lowestrev > nullrev:

541

if lowestrev > nullrev:

542

# But, since we weren't, let's recompute the lowest rev to not

542

# But, since we weren't, let's recompute the lowest rev to not

543

# include roots that aren't ancestors.

543

# include roots that aren't ancestors.

544

545

# Filter out roots that aren't ancestors of heads

545

# Filter out roots that aren't ancestors of heads

546

roots = [n for n in roots if n in ancestors]

546

roots = [n for n in roots if n in ancestors]

547

# Recompute the lowest revision

547

# Recompute the lowest revision

548

if roots:

548

if roots:

549

lowestrev = min([self.rev(n) for n in roots])

549

lowestrev = min([self.rev(n) for n in roots])

550

else:

550

else:

551

# No more roots? Return empty list

551

# No more roots? Return empty list

552

return nonodes

552

return nonodes

553

else:

553

else:

554

# We are descending from nullid, and don't need to care about

554

# We are descending from nullid, and don't need to care about

555

# any other roots.

555

# any other roots.

556

lowestrev = nullrev

556

lowestrev = nullrev

557

roots = [nullid]

557

roots = [nullid]

558

# Transform our roots list into a set.

558

# Transform our roots list into a set.

559

descendents = set(roots)

559

descendents = set(roots)

560

# Also, keep the original roots so we can filter out roots that aren't

560

# Also, keep the original roots so we can filter out roots that aren't

561

# 'real' roots (i.e. are descended from other roots).

561

# 'real' roots (i.e. are descended from other roots).

562

roots = descendents.copy()

562

roots = descendents.copy()

563

# Our topologically sorted list of output nodes.

563

# Our topologically sorted list of output nodes.

564

orderedout = []

564

orderedout = []

565

# Don't start at nullid since we don't want nullid in our output list,

565

# Don't start at nullid since we don't want nullid in our output list,

566

# and if nullid shows up in descedents, empty parents will look like

566

# and if nullid shows up in descedents, empty parents will look like

567

# they're descendents.

567

# they're descendents.

568

for r in xrange(max(lowestrev, 0), highestrev + 1):

568

for r in xrange(max(lowestrev, 0), highestrev + 1):

569

n = self.node(r)

569

n = self.node(r)

570

isdescendent = False

570

isdescendent = False

571

if lowestrev == nullrev: # Everybody is a descendent of nullid

571

if lowestrev == nullrev: # Everybody is a descendent of nullid

572

isdescendent = True

572

isdescendent = True

573

elif n in descendents:

573

elif n in descendents:

574

# n is already a descendent

574

# n is already a descendent

575

isdescendent = True

575

isdescendent = True

576

# This check only needs to be done here because all the roots

576

# This check only needs to be done here because all the roots

577

# will start being marked is descendents before the loop.

577

# will start being marked is descendents before the loop.

578

if n in roots:

578

if n in roots:

579

# If n was a root, check if it's a 'real' root.

579

# If n was a root, check if it's a 'real' root.

580

p = tuple(self.parents(n))

580

p = tuple(self.parents(n))

581

# If any of its parents are descendents, it's not a root.

581

# If any of its parents are descendents, it's not a root.

582

if (p[0] in descendents) or (p[1] in descendents):

582

if (p[0] in descendents) or (p[1] in descendents):

583

roots.remove(n)

583

roots.remove(n)

584

else:

584

else:

585

p = tuple(self.parents(n))

585

p = tuple(self.parents(n))

586

# A node is a descendent if either of its parents are

586

# A node is a descendent if either of its parents are

587

# descendents. (We seeded the dependents list with the roots

587

# descendents. (We seeded the dependents list with the roots

588

# up there, remember?)

588

# up there, remember?)

589

if (p[0] in descendents) or (p[1] in descendents):

589

if (p[0] in descendents) or (p[1] in descendents):

590

descendents.add(n)

590

descendents.add(n)

591

isdescendent = True

591

isdescendent = True

592

if isdescendent and ((ancestors is None) or (n in ancestors)):

592

if isdescendent and ((ancestors is None) or (n in ancestors)):

593

# Only include nodes that are both descendents and ancestors.

593

# Only include nodes that are both descendents and ancestors.

594

orderedout.append(n)

594

orderedout.append(n)

595

if (ancestors is not None) and (n in heads):

595

if (ancestors is not None) and (n in heads):

596

# We're trying to figure out which heads are reachable

596

# We're trying to figure out which heads are reachable

597

# from roots.

597

# from roots.

598

# Mark this head as having been reached

598

# Mark this head as having been reached

599

heads[n] = 1

599

heads[n] = True

600

elif ancestors is None:

600

elif ancestors is None:

601

# Otherwise, we're trying to discover the heads.

601

# Otherwise, we're trying to discover the heads.

602

# Assume this is a head because if it isn't, the next step

602

# Assume this is a head because if it isn't, the next step

603

# will eventually remove it.

603

# will eventually remove it.

604

heads[n] = 1

604

heads[n] = True

605

# But, obviously its parents aren't.

605

# But, obviously its parents aren't.

606

for p in self.parents(n):

606

for p in self.parents(n):

607

heads.pop(p, None)

607

heads.pop(p, None)

608

heads = [n for n in heads.iter~~key~~s() if ~~heads~~[n] != 0]

608

heads = [n for n, flag in heads.iteritems() if flag]

609

roots = list(roots)

609

roots = list(roots)

610

assert orderedout

610

assert orderedout

611

assert roots

611

assert roots

612

assert heads

612

assert heads

613

return (orderedout, roots, heads)

613

return (orderedout, roots, heads)

614

615

def headrevs(self):

615

def headrevs(self):

616

count = len(self)

616

count = len(self)

617

if not count:

617

if not count:

618

return [nullrev]

618

return [nullrev]

619

ishead = [1] * (count + 1)

619

ishead = [1] * (count + 1)

620

index = self.index

620

index = self.index

621

for r in xrange(count):

621

for r in xrange(count):

622

e = index[r]

622

e = index[r]

623

ishead[e[5]] = ishead[e[6]] = 0

623

ishead[e[5]] = ishead[e[6]] = 0

624

return [r for r in xrange(count) if ishead[r]]

624

return [r for r in xrange(count) if ishead[r]]

625

626

def heads(self, start=None, stop=None):

626

def heads(self, start=None, stop=None):

627

"""return the list of all nodes that have no children

627

"""return the list of all nodes that have no children

628

629

if start is specified, only heads that are descendants of

629

if start is specified, only heads that are descendants of

630

start will be returned

630

start will be returned

631

if stop is specified, it will consider all the revs from stop

631

if stop is specified, it will consider all the revs from stop

632

as if they had no children

632

as if they had no children

633

"""

633

"""

634

if start is None and stop is None:

634

if start is None and stop is None:

635

if not len(self):

635

if not len(self):

636

return [nullid]

636

return [nullid]

637

return [self.node(r) for r in self.headrevs()]

637

return [self.node(r) for r in self.headrevs()]

638

639

if start is None:

639

if start is None:

640

start = nullid

640

start = nullid

641

if stop is None:

641

if stop is None:

642

stop = []

642

stop = []

643

stoprevs = set([self.rev(n) for n in stop])

643

stoprevs = set([self.rev(n) for n in stop])

644

startrev = self.rev(start)

644

startrev = self.rev(start)

645

reachable = set((startrev,))

645

reachable = set((startrev,))

646

heads = set((startrev,))

646

heads = set((startrev,))

647

648

parentrevs = self.parentrevs

648

parentrevs = self.parentrevs

649

for r in xrange(startrev + 1, len(self)):

649

for r in xrange(startrev + 1, len(self)):

650

for p in parentrevs(r):

650

for p in parentrevs(r):

651

if p in reachable:

651

if p in reachable:

652

if r not in stoprevs:

652

if r not in stoprevs:

653

reachable.add(r)

653

reachable.add(r)

654

heads.add(r)

654

heads.add(r)

655

if p in heads and p not in stoprevs:

655

if p in heads and p not in stoprevs:

656

heads.remove(p)

656

heads.remove(p)

657

658

return [self.node(r) for r in heads]

658

return [self.node(r) for r in heads]

659

660

def children(self, node):

660

def children(self, node):

661

"""find the children of a given node"""

661

"""find the children of a given node"""

662

c = []

662

c = []

663

p = self.rev(node)

663

p = self.rev(node)

664

for r in range(p + 1, len(self)):

664

for r in range(p + 1, len(self)):

665

prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]

665

prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]

666

if prevs:

666

if prevs:

667

for pr in prevs:

667

for pr in prevs:

668

if pr == p:

668

if pr == p:

669

c.append(self.node(r))

669

c.append(self.node(r))

670

elif p == nullrev:

670

elif p == nullrev:

671

c.append(self.node(r))

671

c.append(self.node(r))

672

return c

672

return c

673

674

def descendant(self, start, end):

674

def descendant(self, start, end):

675

if start == nullrev:

675

if start == nullrev:

676

return True

676

return True

677

for i in self.descendants(start):

677

for i in self.descendants(start):

678

if i == end:

678

if i == end:

679

return True

679

return True

680

elif i > end:

680

elif i > end:

681

break

681

break

682

return False

682

return False

683

684

def ancestor(self, a, b):

684

def ancestor(self, a, b):

685

"""calculate the least common ancestor of nodes a and b"""

685

"""calculate the least common ancestor of nodes a and b"""

686

687

# fast path, check if it is a descendant

687

# fast path, check if it is a descendant

688

a, b = self.rev(a), self.rev(b)

688

a, b = self.rev(a), self.rev(b)

689

start, end = sorted((a, b))

689

start, end = sorted((a, b))

690

if self.descendant(start, end):

690

if self.descendant(start, end):

691

return self.node(start)

691

return self.node(start)

692

693

def parents(rev):

693

def parents(rev):

694

return [p for p in self.parentrevs(rev) if p != nullrev]

694

return [p for p in self.parentrevs(rev) if p != nullrev]

695

696

c = ancestor.ancestor(a, b, parents)

696

c = ancestor.ancestor(a, b, parents)

697

if c is None:

697

if c is None:

698

return nullid

698

return nullid

699

700

return self.node(c)

700

return self.node(c)

701

702

def _match(self, id):

702

def _match(self, id):

703

if isinstance(id, (long, int)):

703

if isinstance(id, (long, int)):

704

# rev

704

# rev

705

return self.node(id)

705

return self.node(id)

706

if len(id) == 20:

706

if len(id) == 20:

707

# possibly a binary node

707

# possibly a binary node

708

# odds of a binary node being all hex in ASCII are 1 in 10**25

708

# odds of a binary node being all hex in ASCII are 1 in 10**25

709

try:

709

try:

710

node = id

710

node = id

711

self.rev(node) # quick search the index

711

self.rev(node) # quick search the index

712

return node

712

return node

713

except LookupError:

713

except LookupError:

714

pass # may be partial hex id

714

pass # may be partial hex id

715

try:

715

try:

716

# str(rev)

716

# str(rev)

717

rev = int(id)

717

rev = int(id)

718

if str(rev) != id:

718

if str(rev) != id:

719

raise ValueError

719

raise ValueError

720

if rev < 0:

720

if rev < 0:

721

rev = len(self) + rev

721

rev = len(self) + rev

722

if rev < 0 or rev >= len(self):

722

if rev < 0 or rev >= len(self):

723

raise ValueError

723

raise ValueError

724

return self.node(rev)

724

return self.node(rev)

725

except (ValueError, OverflowError):

725

except (ValueError, OverflowError):

726

pass

726

pass

727

if len(id) == 40:

727

if len(id) == 40:

728

try:

728

try:

729

# a full hex nodeid?

729

# a full hex nodeid?

730

node = bin(id)

730

node = bin(id)

731

self.rev(node)

731

self.rev(node)

732

return node

732

return node

733

except (TypeError, LookupError):

733

except (TypeError, LookupError):

734

pass

734

pass

735

736

def _partialmatch(self, id):

736

def _partialmatch(self, id):

737

if id in self._pcache:

737

if id in self._pcache:

738

return self._pcache[id]

738

return self._pcache[id]

739

740

if len(id) < 40:

740

if len(id) < 40:

741

try:

741

try:

742

# hex(node)[:...]

742

# hex(node)[:...]

743

l = len(id) // 2 # grab an even number of digits

743

l = len(id) // 2 # grab an even number of digits

744

prefix = bin(id[:l * 2])

744

prefix = bin(id[:l * 2])

745

nl = [e[7] for e in self.index if e[7].startswith(prefix)]

745

nl = [e[7] for e in self.index if e[7].startswith(prefix)]

746

nl = [n for n in nl if hex(n).startswith(id)]

746

nl = [n for n in nl if hex(n).startswith(id)]

747

if len(nl) > 0:

747

if len(nl) > 0:

748

if len(nl) == 1:

748

if len(nl) == 1:

749

self._pcache[id] = nl[0]

749

self._pcache[id] = nl[0]

750

return nl[0]

750

return nl[0]

751

raise LookupError(id, self.indexfile,

751

raise LookupError(id, self.indexfile,

752

_('ambiguous identifier'))

752

_('ambiguous identifier'))

753

return None

753

return None

754

except TypeError:

754

except TypeError:

755

pass

755

pass

756

757

def lookup(self, id):

757

def lookup(self, id):

758

"""locate a node based on:

758

"""locate a node based on:

759

- revision number or str(revision number)

759

- revision number or str(revision number)

760

- nodeid or subset of hex nodeid

760

- nodeid or subset of hex nodeid

761

"""

761

"""

762

n = self._match(id)

762

n = self._match(id)

763

if n is not None:

763

if n is not None:

764

return n

764

return n

765

n = self._partialmatch(id)

765

n = self._partialmatch(id)

766

if n:

766

if n:

767

return n

767

return n

768

769

raise LookupError(id, self.indexfile, _('no match found'))

769

raise LookupError(id, self.indexfile, _('no match found'))

770

771

def cmp(self, node, text):

771

def cmp(self, node, text):

772

"""compare text with a given file revision

772

"""compare text with a given file revision

773

774

returns True if text is different than what is stored.

774

returns True if text is different than what is stored.

775

"""

775

"""

776

p1, p2 = self.parents(node)

776

p1, p2 = self.parents(node)

777

return hash(text, p1, p2) != node

777

return hash(text, p1, p2) != node

778

779

def _addchunk(self, offset, data):

779

def _addchunk(self, offset, data):

780

o, d = self._chunkcache

780

o, d = self._chunkcache

781

# try to add to existing cache

781

# try to add to existing cache

782

if o + len(d) == offset and len(d) + len(data) < _chunksize:

782

if o + len(d) == offset and len(d) + len(data) < _chunksize:

783

self._chunkcache = o, d + data

783

self._chunkcache = o, d + data

784

else:

784

else:

785

self._chunkcache = offset, data

785

self._chunkcache = offset, data

786

787

def _loadchunk(self, offset, length):

787

def _loadchunk(self, offset, length):

788

if self._inline:

788

if self._inline:

789

df = self.opener(self.indexfile)

789

df = self.opener(self.indexfile)

790

else:

790

else:

791

df = self.opener(self.datafile)

791

df = self.opener(self.datafile)

792

793

readahead = max(65536, length)

793

readahead = max(65536, length)

794

df.seek(offset)

794

df.seek(offset)

795

d = df.read(readahead)

795

d = df.read(readahead)

796

self._addchunk(offset, d)

796

self._addchunk(offset, d)

797

if readahead > length:

797

if readahead > length:

798

return d[:length]

798

return d[:length]

799

return d

799

return d

800

801

def _getchunk(self, offset, length):

801

def _getchunk(self, offset, length):

802

o, d = self._chunkcache

802

o, d = self._chunkcache

803

l = len(d)

803

l = len(d)

804

805

# is it in the cache?

805

# is it in the cache?

806

cachestart = offset - o

806

cachestart = offset - o

807

cacheend = cachestart + length

807

cacheend = cachestart + length

808

if cachestart >= 0 and cacheend <= l:

808

if cachestart >= 0 and cacheend <= l:

809

if cachestart == 0 and cacheend == l:

809

if cachestart == 0 and cacheend == l:

810

return d # avoid a copy

810

return d # avoid a copy

811

return d[cachestart:cacheend]

811

return d[cachestart:cacheend]

812

813

return self._loadchunk(offset, length)

813

return self._loadchunk(offset, length)

814

815

def _chunkraw(self, startrev, endrev):

815

def _chunkraw(self, startrev, endrev):

816

start = self.start(startrev)

816

start = self.start(startrev)

817

length = self.end(endrev) - start

817

length = self.end(endrev) - start

818

if self._inline:

818

if self._inline:

819

start += (startrev + 1) * self._io.size

819

start += (startrev + 1) * self._io.size

820

return self._getchunk(start, length)

820

return self._getchunk(start, length)

821

822

def _chunk(self, rev):

822

def _chunk(self, rev):

823

return decompress(self._chunkraw(rev, rev))

823

return decompress(self._chunkraw(rev, rev))

824

825

def _chunkbase(self, rev):

825

def _chunkbase(self, rev):

826

return self._chunk(rev)

826

return self._chunk(rev)

827

828

def _chunkclear(self):

828

def _chunkclear(self):

829

self._chunkcache = (0, '')

829

self._chunkcache = (0, '')

830

831

def deltaparent(self, rev):

831

def deltaparent(self, rev):

832

"""return deltaparent of the given revision"""

832

"""return deltaparent of the given revision"""

833

if self.index[rev][3] == rev:

833

if self.index[rev][3] == rev:

834

return nullrev

834

return nullrev

835

else:

835

else:

836

return rev - 1

836

return rev - 1

837

838

def revdiff(self, rev1, rev2):

838

def revdiff(self, rev1, rev2):

839

"""return or calculate a delta between two revisions"""

839

"""return or calculate a delta between two revisions"""

840

if rev1 != nullrev and self.deltaparent(rev2) == rev1:

840

if rev1 != nullrev and self.deltaparent(rev2) == rev1:

841

return self._chunk(rev2)

841

return self._chunk(rev2)

842

843

return mdiff.textdiff(self.revision(self.node(rev1)),

843

return mdiff.textdiff(self.revision(self.node(rev1)),

844

self.revision(self.node(rev2)))

844

self.revision(self.node(rev2)))

845

846

def revision(self, node):

846

def revision(self, node):

847

"""return an uncompressed revision of a given node"""

847

"""return an uncompressed revision of a given node"""

848

cachedrev = None

848

cachedrev = None

849

if node == nullid:

849

if node == nullid:

850

return ""

850

return ""

851

if self._cache:

851

if self._cache:

852

if self._cache[0] == node:

852

if self._cache[0] == node:

853

return self._cache[2]

853

return self._cache[2]

854

cachedrev = self._cache[1]

854

cachedrev = self._cache[1]

855

856

# look up what we need to read

856

# look up what we need to read

857

text = None

857

text = None

858

rev = self.rev(node)

858

rev = self.rev(node)

859

base = self.base(rev)

859

base = self.base(rev)

860

861

# check rev flags

861

# check rev flags

862

if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:

862

if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:

863

raise RevlogError(_('incompatible revision flag %x') %

863

raise RevlogError(_('incompatible revision flag %x') %

864

(self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

864

(self.flags(rev) & ~REVIDX_KNOWN_FLAGS))

865

866

# build delta chain

866

# build delta chain

867

chain = []

867

chain = []

868

iterrev = rev

868

iterrev = rev

869

while iterrev != base and iterrev != cachedrev:

869

while iterrev != base and iterrev != cachedrev:

870

chain.append(iterrev)

870

chain.append(iterrev)

871

iterrev -= 1

871

iterrev -= 1

872

chain.reverse()

872

chain.reverse()

873

base = iterrev

873

base = iterrev

874

875

if iterrev == cachedrev:

875

if iterrev == cachedrev:

876

# cache hit

876

# cache hit

877

text = self._cache[2]

877

text = self._cache[2]

878

879

# drop cache to save memory

879

# drop cache to save memory

880

self._cache = None

880

self._cache = None

881

882

self._chunkraw(base, rev)

882

self._chunkraw(base, rev)

883

if text is None:

883

if text is None:

884

text = self._chunkbase(base)

884

text = self._chunkbase(base)

885

886

bins = [self._chunk(r) for r in chain]

886

bins = [self._chunk(r) for r in chain]

887

text = mdiff.patches(text, bins)

887

text = mdiff.patches(text, bins)

888

889

text = self._checkhash(text, node, rev)

889

text = self._checkhash(text, node, rev)

890

891

self._cache = (node, rev, text)

891

self._cache = (node, rev, text)

892

return text

892

return text

893

894

def _checkhash(self, text, node, rev):

894

def _checkhash(self, text, node, rev):

895

p1, p2 = self.parents(node)

895

p1, p2 = self.parents(node)

896

if node != hash(text, p1, p2):

896

if node != hash(text, p1, p2):

897

raise RevlogError(_("integrity check failed on %s:%d")

897

raise RevlogError(_("integrity check failed on %s:%d")

898

% (self.indexfile, rev))

898

% (self.indexfile, rev))

899

return text

899

return text

900

901

def checkinlinesize(self, tr, fp=None):

901

def checkinlinesize(self, tr, fp=None):

902

if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:

902

if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:

903

return

903

return

904

905

trinfo = tr.find(self.indexfile)

905

trinfo = tr.find(self.indexfile)

906

if trinfo is None:

906

if trinfo is None:

907

raise RevlogError(_("%s not found in the transaction")

907

raise RevlogError(_("%s not found in the transaction")

908

% self.indexfile)

908

% self.indexfile)

909

910

trindex = trinfo[2]

910

trindex = trinfo[2]

911

dataoff = self.start(trindex)

911

dataoff = self.start(trindex)

912

913

tr.add(self.datafile, dataoff)

913

tr.add(self.datafile, dataoff)

914

915

if fp:

915

if fp:

916

fp.flush()

916

fp.flush()

917

fp.close()

917

fp.close()

918

919

df = self.opener(self.datafile, 'w')

919

df = self.opener(self.datafile, 'w')

920

try:

920

try:

921

for r in self:

921

for r in self:

922

df.write(self._chunkraw(r, r))

922

df.write(self._chunkraw(r, r))

923

finally:

923

finally:

924

df.close()

924

df.close()

925

926

fp = self.opener(self.indexfile, 'w', atomictemp=True)

926

fp = self.opener(self.indexfile, 'w', atomictemp=True)

927

self.version &= ~(REVLOGNGINLINEDATA)

927

self.version &= ~(REVLOGNGINLINEDATA)

928

self._inline = False

928

self._inline = False

929

for i in self:

929

for i in self:

930

e = self._io.packentry(self.index[i], self.node, self.version, i)

930

e = self._io.packentry(self.index[i], self.node, self.version, i)

931

fp.write(e)

931

fp.write(e)

932

933

# if we don't call rename, the temp file will never replace the

933

# if we don't call rename, the temp file will never replace the

934

# real index

934

# real index

935

fp.rename()

935

fp.rename()

936

937

tr.replace(self.indexfile, trindex * self._io.size)

937

tr.replace(self.indexfile, trindex * self._io.size)

938

self._chunkclear()

938

self._chunkclear()

939

940

def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):

940

def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):

941

"""add a revision to the log

941

"""add a revision to the log

942

943

text - the revision data to add

943

text - the revision data to add

944

transaction - the transaction object used for rollback

944

transaction - the transaction object used for rollback

945

link - the linkrev data to add

945

link - the linkrev data to add

946

p1, p2 - the parent nodeids of the revision

946

p1, p2 - the parent nodeids of the revision

947

cachedelta - an optional precomputed delta

947

cachedelta - an optional precomputed delta

948

"""

948

"""

949

node = hash(text, p1, p2)

949

node = hash(text, p1, p2)

950

if node in self.nodemap:

950

if node in self.nodemap:

951

return node

951

return node

952

953

dfh = None

953

dfh = None

954

if not self._inline:

954

if not self._inline:

955

dfh = self.opener(self.datafile, "a")

955

dfh = self.opener(self.datafile, "a")

956

ifh = self.opener(self.indexfile, "a+")

956

ifh = self.opener(self.indexfile, "a+")

957

try:

957

try:

958

return self._addrevision(node, text, transaction, link, p1, p2,

958

return self._addrevision(node, text, transaction, link, p1, p2,

959

cachedelta, ifh, dfh)

959

cachedelta, ifh, dfh)

960

finally:

960

finally:

961

if dfh:

961

if dfh:

962

dfh.close()

962

dfh.close()

963

ifh.close()

963

ifh.close()

964

965

def _addrevision(self, node, text, transaction, link, p1, p2,

965

def _addrevision(self, node, text, transaction, link, p1, p2,

966

cachedelta, ifh, dfh):

966

cachedelta, ifh, dfh):

967

968

btext = [text]

968

btext = [text]

969

def buildtext():

969

def buildtext():

970

if btext[0] is not None:

970

if btext[0] is not None:

971

return btext[0]

971

return btext[0]

972

# flush any pending writes here so we can read it in revision

972

# flush any pending writes here so we can read it in revision

973

if dfh:

973

if dfh:

974

dfh.flush()

974

dfh.flush()

975

ifh.flush()

975

ifh.flush()

976

basetext = self.revision(self.node(cachedelta[0]))

976

basetext = self.revision(self.node(cachedelta[0]))

977

btext[0] = mdiff.patch(basetext, cachedelta[1])

977

btext[0] = mdiff.patch(basetext, cachedelta[1])

978

chk = hash(btext[0], p1, p2)

978

chk = hash(btext[0], p1, p2)

979

if chk != node:

979

if chk != node:

980

raise RevlogError(_("consistency error in delta"))

980

raise RevlogError(_("consistency error in delta"))

981

return btext[0]

981

return btext[0]

982

983

def builddelta(rev):

983

def builddelta(rev):

984

# can we use the cached delta?

984

# can we use the cached delta?

985

if cachedelta and cachedelta[0] == rev:

985

if cachedelta and cachedelta[0] == rev:

986

delta = cachedelta[1]

986

delta = cachedelta[1]

987

else:

987

else:

988

t = buildtext()

988

t = buildtext()

989

ptext = self.revision(self.node(rev))

989

ptext = self.revision(self.node(rev))

990

delta = mdiff.textdiff(ptext, t)

990

delta = mdiff.textdiff(ptext, t)

991

data = compress(delta)

991

data = compress(delta)

992

l = len(data[1]) + len(data[0])

992

l = len(data[1]) + len(data[0])

993

base = self.base(rev)

993

base = self.base(rev)

994

dist = l + offset - self.start(base)

994

dist = l + offset - self.start(base)

995

return dist, l, data, base

995

return dist, l, data, base

996

997

curr = len(self)

997

curr = len(self)

998

prev = curr - 1

998

prev = curr - 1

999

base = curr

999

base = curr

1000

offset = self.end(prev)

1000

offset = self.end(prev)

1001

flags = 0

1001

flags = 0

1002

d = None

1002

d = None

1003

p1r, p2r = self.rev(p1), self.rev(p2)

1003

p1r, p2r = self.rev(p1), self.rev(p2)

1004

1005

# should we try to build a delta?

1005

# should we try to build a delta?

1006

if prev != nullrev:

1006

if prev != nullrev:

1007

d = builddelta(prev)

1007

d = builddelta(prev)

1008

dist, l, data, base = d

1008

dist, l, data, base = d

1009

1010

# full versions are inserted when the needed deltas

1010

# full versions are inserted when the needed deltas

1011

# become comparable to the uncompressed text

1011

# become comparable to the uncompressed text

1012

if text is None:

1012

if text is None:

1013

textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),

1013

textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),

1014

cachedelta[1])

1014

cachedelta[1])

1015

else:

1015

else:

1016

textlen = len(text)

1016

textlen = len(text)

1017

if d is None or dist > textlen * 2:

1017

if d is None or dist > textlen * 2:

1018

text = buildtext()

1018

text = buildtext()

1019

data = compress(text)

1019

data = compress(text)

1020

l = len(data[1]) + len(data[0])

1020

l = len(data[1]) + len(data[0])

1021

base = curr

1021

base = curr

1022

1023

e = (offset_type(offset, flags), l, textlen,

1023

e = (offset_type(offset, flags), l, textlen,

1024

base, link, p1r, p2r, node)

1024

base, link, p1r, p2r, node)

1025

self.index.insert(-1, e)

1025

self.index.insert(-1, e)

1026

self.nodemap[node] = curr

1026

self.nodemap[node] = curr

1027

1028

entry = self._io.packentry(e, self.node, self.version, curr)

1028

entry = self._io.packentry(e, self.node, self.version, curr)

1029

if not self._inline:

1029

if not self._inline:

1030

transaction.add(self.datafile, offset)

1030

transaction.add(self.datafile, offset)

1031

transaction.add(self.indexfile, curr * len(entry))

1031

transaction.add(self.indexfile, curr * len(entry))

1032

if data[0]:

1032

if data[0]:

1033

dfh.write(data[0])

1033

dfh.write(data[0])

1034

dfh.write(data[1])

1034

dfh.write(data[1])

1035

dfh.flush()

1035

dfh.flush()

1036

ifh.write(entry)

1036

ifh.write(entry)

1037

else:

1037

else:

1038

offset += curr * self._io.size

1038

offset += curr * self._io.size

1039

transaction.add(self.indexfile, offset, curr)

1039

transaction.add(self.indexfile, offset, curr)

1040

ifh.write(entry)

1040

ifh.write(entry)

1041

ifh.write(data[0])

1041

ifh.write(data[0])

1042

ifh.write(data[1])

1042

ifh.write(data[1])

1043

self.checkinlinesize(transaction, ifh)

1043

self.checkinlinesize(transaction, ifh)

1044

1045

if type(text) == str: # only accept immutable objects

1045

if type(text) == str: # only accept immutable objects

1046

self._cache = (node, curr, text)

1046

self._cache = (node, curr, text)

1047

return node

1047

return node

1048

1049

def group(self, nodelist, bundler):

1049

def group(self, nodelist, bundler):

1050

"""Calculate a delta group, yielding a sequence of changegroup chunks

1050

"""Calculate a delta group, yielding a sequence of changegroup chunks

1051

(strings).

1051

(strings).

1052

1053

Given a list of changeset revs, return a set of deltas and

1053

Given a list of changeset revs, return a set of deltas and

1054

metadata corresponding to nodes. The first delta is

1054

metadata corresponding to nodes. The first delta is

1055

first parent(nodelist[0]) -> nodelist[0], the receiver is

1055

first parent(nodelist[0]) -> nodelist[0], the receiver is

1056

guaranteed to have this parent as it has all history before

1056

guaranteed to have this parent as it has all history before

1057

these changesets. In the case firstparent is nullrev the

1057

these changesets. In the case firstparent is nullrev the

1058

changegroup starts with a full revision.

1058

changegroup starts with a full revision.

1059

"""

1059

"""

1060

1061

revs = sorted([self.rev(n) for n in nodelist])

1061

revs = sorted([self.rev(n) for n in nodelist])

1062

1063

# if we don't have any revisions touched by these changesets, bail

1063

# if we don't have any revisions touched by these changesets, bail

1064

if not revs:

1064

if not revs:

1065

yield bundler.close()

1065

yield bundler.close()

1066

return

1066

return

1067

1068

# add the parent of the first rev

1068

# add the parent of the first rev

1069

p = self.parentrevs(revs[0])[0]

1069

p = self.parentrevs(revs[0])[0]

1070

revs.insert(0, p)

1070

revs.insert(0, p)

1071

1072

# build deltas

1072

# build deltas

1073

for r in xrange(len(revs) - 1):

1073

for r in xrange(len(revs) - 1):

1074

prev, curr = revs[r], revs[r + 1]

1074

prev, curr = revs[r], revs[r + 1]

1075

for c in bundler.revchunk(self, curr, prev):

1075

for c in bundler.revchunk(self, curr, prev):

1076

yield c

1076

yield c

1077

1078

yield bundler.close()

1078

yield bundler.close()

1079

1080

def addgroup(self, bundle, linkmapper, transaction):

1080

def addgroup(self, bundle, linkmapper, transaction):

1081

"""

1081

"""

1082

add a delta group

1082

add a delta group

1083

1084

given a set of deltas, add them to the revision log. the

1084

given a set of deltas, add them to the revision log. the

1085

first delta is against its parent, which should be in our

1085

first delta is against its parent, which should be in our

1086

log, the rest are against the previous delta.

1086

log, the rest are against the previous delta.

1087

"""

1087

"""

1088

1089

# track the base of the current delta log

1089

# track the base of the current delta log

1090

node = None

1090

node = None

1091

1092

r = len(self)

1092

r = len(self)

1093

end = 0

1093

end = 0

1094

if r:

1094

if r:

1095

end = self.end(r - 1)

1095

end = self.end(r - 1)

1096

ifh = self.opener(self.indexfile, "a+")

1096

ifh = self.opener(self.indexfile, "a+")

1097

isize = r * self._io.size

1097

isize = r * self._io.size

1098

if self._inline:

1098

if self._inline:

1099

transaction.add(self.indexfile, end + isize, r)

1099

transaction.add(self.indexfile, end + isize, r)

1100

dfh = None

1100

dfh = None

1101

else:

1101

else:

1102

transaction.add(self.indexfile, isize, r)

1102

transaction.add(self.indexfile, isize, r)

1103

transaction.add(self.datafile, end)

1103

transaction.add(self.datafile, end)

1104

dfh = self.opener(self.datafile, "a")

1104

dfh = self.opener(self.datafile, "a")

1105

1106

try:

1106

try:

1107

# loop through our set of deltas

1107

# loop through our set of deltas

1108

chain = None

1108

chain = None

1109

while 1:

1109

while 1:

1110

chunkdata = bundle.deltachunk(chain)

1110

chunkdata = bundle.deltachunk(chain)

1111

if not chunkdata:

1111

if not chunkdata:

1112

break

1112

break

1113

node = chunkdata['node']

1113

node = chunkdata['node']

1114

p1 = chunkdata['p1']

1114

p1 = chunkdata['p1']

1115

p2 = chunkdata['p2']

1115

p2 = chunkdata['p2']

1116

cs = chunkdata['cs']

1116

cs = chunkdata['cs']

1117

deltabase = chunkdata['deltabase']

1117

deltabase = chunkdata['deltabase']

1118

delta = chunkdata['delta']

1118

delta = chunkdata['delta']

1119

1120

link = linkmapper(cs)

1120

link = linkmapper(cs)

1121

if node in self.nodemap:

1121

if node in self.nodemap:

1122

# this can happen if two branches make the same change

1122

# this can happen if two branches make the same change

1123

chain = node

1123

chain = node

1124

continue

1124

continue

1125

1126

for p in (p1, p2):

1126

for p in (p1, p2):

1127

if not p in self.nodemap:

1127

if not p in self.nodemap:

1128

raise LookupError(p, self.indexfile,

1128

raise LookupError(p, self.indexfile,

1129

_('unknown parent'))

1129

_('unknown parent'))

1130

1131

if deltabase not in self.nodemap:

1131

if deltabase not in self.nodemap:

1132

raise LookupError(deltabase, self.indexfile,

1132

raise LookupError(deltabase, self.indexfile,

1133

_('unknown delta base'))

1133

_('unknown delta base'))

1134

1135

baserev = self.rev(deltabase)

1135

baserev = self.rev(deltabase)

1136

chain = self._addrevision(node, None, transaction, link,

1136

chain = self._addrevision(node, None, transaction, link,

1137

p1, p2, (baserev, delta), ifh, dfh)

1137

p1, p2, (baserev, delta), ifh, dfh)

1138

if not dfh and not self._inline:

1138

if not dfh and not self._inline:

1139

# addrevision switched from inline to conventional

1139

# addrevision switched from inline to conventional

1140

# reopen the index

1140

# reopen the index

1141

ifh.close()

1141

ifh.close()

1142

dfh = self.opener(self.datafile, "a")

1142

dfh = self.opener(self.datafile, "a")

1143

ifh = self.opener(self.indexfile, "a")

1143

ifh = self.opener(self.indexfile, "a")

1144

finally:

1144

finally:

1145

if dfh:

1145

if dfh:

1146

dfh.close()

1146

dfh.close()

1147

ifh.close()

1147

ifh.close()

1148

1149

return node

1149

return node

1150

1151

def strip(self, minlink, transaction):

1151

def strip(self, minlink, transaction):

1152

"""truncate the revlog on the first revision with a linkrev >= minlink

1152

"""truncate the revlog on the first revision with a linkrev >= minlink

1153

1154

This function is called when we're stripping revision minlink and

1154

This function is called when we're stripping revision minlink and

1155

its descendants from the repository.

1155

its descendants from the repository.

1156

1157

We have to remove all revisions with linkrev >= minlink, because

1157

We have to remove all revisions with linkrev >= minlink, because

1158

the equivalent changelog revisions will be renumbered after the

1158

the equivalent changelog revisions will be renumbered after the

1159

strip.

1159

strip.

1160

1161

So we truncate the revlog on the first of these revisions, and

1161

So we truncate the revlog on the first of these revisions, and

1162

trust that the caller has saved the revisions that shouldn't be

1162

trust that the caller has saved the revisions that shouldn't be

1163

removed and that it'll readd them after this truncation.

1163

removed and that it'll readd them after this truncation.

1164

"""

1164

"""

1165

if len(self) == 0:

1165

if len(self) == 0:

1166

return

1166

return

1167

1168

for rev in self:

1168

for rev in self:

1169

if self.index[rev][4] >= minlink:

1169

if self.index[rev][4] >= minlink:

1170

break

1170

break

1171

else:

1171

else:

1172

return

1172

return

1173

1174

# first truncate the files on disk

1174

# first truncate the files on disk

1175

end = self.start(rev)

1175

end = self.start(rev)

1176

if not self._inline:

1176

if not self._inline:

1177

transaction.add(self.datafile, end)

1177

transaction.add(self.datafile, end)

1178

end = rev * self._io.size

1178

end = rev * self._io.size

1179

else:

1179

else:

1180

end += rev * self._io.size

1180

end += rev * self._io.size

1181

1182

transaction.add(self.indexfile, end)

1182

transaction.add(self.indexfile, end)

1183

1184

# then reset internal state in memory to forget those revisions

1184

# then reset internal state in memory to forget those revisions

1185

self._cache = None

1185

self._cache = None

1186

self._chunkclear()

1186

self._chunkclear()

1187

for x in xrange(rev, len(self)):

1187

for x in xrange(rev, len(self)):

1188

del self.nodemap[self.node(x)]

1188

del self.nodemap[self.node(x)]

1189

1190

del self.index[rev:-1]

1190

del self.index[rev:-1]

1191

1192

def checksize(self):

1192

def checksize(self):

1193

expected = 0

1193

expected = 0

1194

if len(self):

1194

if len(self):

1195

expected = max(0, self.end(len(self) - 1))

1195

expected = max(0, self.end(len(self) - 1))

1196

1197

try:

1197

try:

1198

f = self.opener(self.datafile)

1198

f = self.opener(self.datafile)

1199

f.seek(0, 2)

1199

f.seek(0, 2)

1200

actual = f.tell()

1200

actual = f.tell()

1201

f.close()

1201

f.close()

1202

dd = actual - expected

1202

dd = actual - expected

1203

except IOError, inst:

1203

except IOError, inst:

1204

if inst.errno != errno.ENOENT:

1204

if inst.errno != errno.ENOENT:

1205

raise

1205

raise

1206

dd = 0

1206

dd = 0

1207

1208

try:

1208

try:

1209

f = self.opener(self.indexfile)

1209

f = self.opener(self.indexfile)

1210

f.seek(0, 2)

1210

f.seek(0, 2)

1211

actual = f.tell()

1211

actual = f.tell()

1212

f.close()

1212

f.close()

1213

s = self._io.size

1213

s = self._io.size

1214

i = max(0, actual // s)

1214

i = max(0, actual // s)

1215

di = actual - (i * s)

1215

di = actual - (i * s)

1216

if self._inline:

1216

if self._inline:

1217

databytes = 0

1217

databytes = 0

1218

for r in self:

1218

for r in self:

1219

databytes += max(0, self.length(r))

1219

databytes += max(0, self.length(r))

1220

dd = 0

1220

dd = 0

1221

di = actual - len(self) * s - databytes

1221

di = actual - len(self) * s - databytes

1222

except IOError, inst:

1222

except IOError, inst:

1223

if inst.errno != errno.ENOENT:

1223

if inst.errno != errno.ENOENT:

1224

raise

1224

raise

1225

di = 0

1225

di = 0

1226

1227

return (dd, di)

1227

return (dd, di)

1228

1229

def files(self):

1229

def files(self):

1230

res = [self.indexfile]

1230

res = [self.indexfile]

1231

if not self._inline:

1231

if not self._inline:

1232

res.append(self.datafile)

1232

res.append(self.datafile)

1233

return res

1233

return res

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # revlog.py - storage back-end for mercurial
             #
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             """Storage back-end for Mercurial.
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches.
             """
             # import stuff from node for others to import from revlog
             from node import bin, hex, nullid, nullrev, short #@UnusedImport
             from i18n import _
             import ancestor, mdiff, parsers, error, util
             import struct, zlib, errno
             _pack = struct.pack
             _unpack = struct.unpack
             _compress = zlib.compress
             _decompress = zlib.decompress
             _sha = util.sha1
             # revlog header flags
             REVLOGV0 = 0
             REVLOGNG = 1
             REVLOGNGINLINEDATA = (1 << 16)
             REVLOGSHALLOW = (1 << 17)
             REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
             REVLOG_DEFAULT_FORMAT = REVLOGNG
             REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
             REVLOGNG_FLAGS = REVLOGNGINLINEDATA | REVLOGSHALLOW
             # revlog index flags
             REVIDX_KNOWN_FLAGS = 0
             # max size of revlog with inline data
             _maxinline = 131072
             _chunksize = 1048576
             RevlogError = error.RevlogError
             LookupError = error.LookupError
             def getoffset(q):
                 return int(q >> 16)
             def gettype(q):
                 return int(q & 0xFFFF)
             def offset_type(offset, type):
                 return long(long(offset) << 16 | type)
             nullhash = _sha(nullid)
             def hash(text, p1, p2):
                 """generate a hash from the given text and its parent hashes
                 This hash combines both the current file contents and its history
                 in a manner that makes it easy to distinguish nodes with the same
                 content in the revision graph.
                 """
                 # As of now, if one of the parent node is null, p2 is null
                 if p2 == nullid:
                     # deep copy of a hash is faster than creating one
                     s = nullhash.copy()
                     s.update(p1)
                 else:
                     # none of the parent nodes are nullid
                     l = [p1, p2]
                     l.sort()
                     s = _sha(l[0])
                     s.update(l[1])
                 s.update(text)
                 return s.digest()
             def compress(text):
                 """ generate a possibly-compressed representation of text """
                 if not text:
                     return ("", text)
                 l = len(text)
                 bin = None
                 if l < 44:
                     pass
                 elif l > 1000000:
                     # zlib makes an internal copy, thus doubling memory usage for
                     # large files, so lets do this in pieces
                     z = zlib.compressobj()
                     p = []
                     pos = 0
                     while pos < l:
                         pos2 = pos + 2**20
                         p.append(z.compress(text[pos:pos2]))
                         pos = pos2
                     p.append(z.flush())
                     if sum(map(len, p)) < l:
                         bin = "".join(p)
                 else:
                     bin = _compress(text)
                 if bin is None or len(bin) > l:
                     if text[0] == '\0':
                         return ("", text)
                     return ('u', text)
                 return ("", bin)
             def decompress(bin):
                 """ decompress the given input """
                 if not bin:
                     return bin
                 t = bin[0]
                 if t == '\0':
                     return bin
                 if t == 'x':
                     return _decompress(bin)
                 if t == 'u':
                     return bin[1:]
                 raise RevlogError(_("unknown compression type %r") % t)
             indexformatv0 = ">4l20s20s20s"
             v0shaoffset = 56
             class revlogoldio(object):
                 def __init__(self):
                     self.size = struct.calcsize(indexformatv0)
                 def parseindex(self, data, inline):
                     s = self.size
                     index = []
                     nodemap =  {nullid: nullrev}
                     n = off = 0
                     l = len(data)
                     while off + s <= l:
                         cur = data[off:off + s]
                         off += s
                         e = _unpack(indexformatv0, cur)
                         # transform to revlogv1 format
                         e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                               nodemap.get(e[4], nullrev), nodemap.get(e[5], nullrev), e[6])
                         index.append(e2)
                         nodemap[e[6]] = n
                         n += 1
                     # add the magic null revision at -1
                     index.append((0, 0, 0, -1, -1, -1, -1, nullid))
                     return index, nodemap, None
                 def packentry(self, entry, node, version, rev):
                     if gettype(entry[0]):
                         raise RevlogError(_("index entry flags need RevlogNG"))
                     e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
                           node(entry[5]), node(entry[6]), entry[7])
                     return _pack(indexformatv0, *e2)
             # index ng:
             #  6 bytes: offset
             #  2 bytes: flags
             #  4 bytes: compressed length
             #  4 bytes: uncompressed length
             #  4 bytes: base rev
             #  4 bytes: link rev
             #  4 bytes: parent 1 rev
             #  4 bytes: parent 2 rev
             # 32 bytes: nodeid
             indexformatng = ">Qiiiiii20s12x"
             ngshaoffset = 32
             versionformat = ">I"
             class revlogio(object):
                 def __init__(self):
                     self.size = struct.calcsize(indexformatng)
                 def parseindex(self, data, inline):
                     # call the C implementation to parse the index data
                     index, cache = parsers.parse_index2(data, inline)
                     return index, None, cache
                 def packentry(self, entry, node, version, rev):
                     p = _pack(indexformatng, *entry)
                     if rev == 0:
                         p = _pack(versionformat, version) + p[4:]
                     return p
             class revlog(object):
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, including its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 """
                 def __init__(self, opener, indexfile, shallowroot=None):
                     """
                     create a revlog object
                     opener is a function that abstracts the file opening operation
                     and can be used to implement COW semantics or the like.
                     """
                     self.indexfile = indexfile
                     self.datafile = indexfile[:-2] + ".d"
                     self.opener = opener
                     self._cache = None
                     self._chunkcache = (0, '')
                     self.index = []
                     self._shallowroot = shallowroot
                     self._pcache = {}
                     self._nodecache = {nullid: nullrev}
                     self._nodepos = None
                     v = REVLOG_DEFAULT_VERSION
                     if hasattr(opener, 'options') and 'defversion' in opener.options:
                         v = opener.options['defversion']
                         if v & REVLOGNG:
                             v |= REVLOGNGINLINEDATA
                     if shallowroot:
                         v |= REVLOGSHALLOW
                     i = ''
                     try:
                         f = self.opener(self.indexfile)
                         i = f.read()
                         f.close()
                         if len(i) > 0:
                             v = struct.unpack(versionformat, i[:4])[0]
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                     self.version = v
                     self._inline = v & REVLOGNGINLINEDATA
                     self._shallow = v & REVLOGSHALLOW
                     flags = v & ~0xFFFF
                     fmt = v & 0xFFFF
                     if fmt == REVLOGV0 and flags:
                         raise RevlogError(_("index %s unknown flags %#04x for format v0")
                                           % (self.indexfile, flags >> 16))
                     elif fmt == REVLOGNG and flags & ~REVLOGNG_FLAGS:
                         raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                                           % (self.indexfile, flags >> 16))
                     elif fmt > REVLOGNG:
                         raise RevlogError(_("index %s unknown format %d")
                                           % (self.indexfile, fmt))
                     self._io = revlogio()
                     if self.version == REVLOGV0:
                         self._io = revlogoldio()
                     try:
                         d = self._io.parseindex(i, self._inline)
                     except (ValueError, IndexError):
                         raise RevlogError(_("index %s is corrupted") % (self.indexfile))
                     self.index, nodemap, self._chunkcache = d
                     if nodemap is not None:
                         self.nodemap = self._nodecache = nodemap
                     if not self._chunkcache:
                         self._chunkclear()
                 def tip(self):
                     return self.node(len(self.index) - 2)
                 def __len__(self):
                     return len(self.index) - 1
                 def __iter__(self):
                     for i in xrange(len(self)):
                         yield i
                 @util.propertycache
                 def nodemap(self):
                     self.rev(self.node(0))
                     return self._nodecache
                 def rev(self, node):
                     try:
                         return self._nodecache[node]
                     except KeyError:
                         n = self._nodecache
                         i = self.index
                         p = self._nodepos
                         if p is None:
                             p = len(i) - 2
                         for r in xrange(p, -1, -1):
                             v = i[r][7]
                             n[v] = r
                             if v == node:
                                 self._nodepos = r - 1
                                 return r
                         raise LookupError(node, self.indexfile, _('no node'))
                 def node(self, rev):
                     return self.index[rev][7]
                 def linkrev(self, rev):
                     return self.index[rev][4]
                 def parents(self, node):
                     i = self.index
                     d = i[self.rev(node)]
                     return i[d[5]][7], i[d[6]][7] # map revisions to nodes inline
                 def parentrevs(self, rev):
                     return self.index[rev][5:7]
                 def start(self, rev):
                     return int(self.index[rev][0] >> 16)
                 def end(self, rev):
                     return self.start(rev) + self.length(rev)
                 def length(self, rev):
                     return self.index[rev][1]
                 def base(self, rev):
                     return self.index[rev][3]
                 def flags(self, rev):
                     return self.index[rev][0] & 0xFFFF
                 def rawsize(self, rev):
                     """return the length of the uncompressed text for a given revision"""
                     l = self.index[rev][2]
                     if l >= 0:
                         return l
                     t = self.revision(self.node(rev))
                     return len(t)
                 size = rawsize
                 def reachable(self, node, stop=None):
                     """return the set of all nodes ancestral to a given node, including
                      the node itself, stopping when stop is matched"""
                     reachable = set((node,))
                     visit = [node]
                     if stop:
                         stopn = self.rev(stop)
                     else:
                         stopn = 0
                     while visit:
                         n = visit.pop(0)
                         if n == stop:
                             continue
                         if n == nullid:
                             continue
                         for p in self.parents(n):
                             if self.rev(p) < stopn:
                                 continue
                             if p not in reachable:
                                 reachable.add(p)
                                 visit.append(p)
                     return reachable
                 def ancestors(self, *revs):
                     """Generate the ancestors of 'revs' in reverse topological order.
                     Yield a sequence of revision numbers starting with the parents
                     of each revision in revs, i.e., each revision is *not* considered
                     an ancestor of itself.  Results are in breadth-first order:
                     parents of each rev in revs, then parents of those, etc.  Result
                     does not include the null revision."""
                     visit = list(revs)
                     seen = set([nullrev])
                     while visit:
                         for parent in self.parentrevs(visit.pop(0)):
                             if parent not in seen:
                                 visit.append(parent)
                                 seen.add(parent)
                                 yield parent
                 def descendants(self, *revs):
                     """Generate the descendants of 'revs' in revision order.
                     Yield a sequence of revision numbers starting with a child of
                     some rev in revs, i.e., each revision is *not* considered a
                     descendant of itself.  Results are ordered by revision number (a
                     topological sort)."""
                     first = min(revs)
                     if first == nullrev:
                         for i in self:
                             yield i
                         return
                     seen = set(revs)
                     for i in xrange(first + 1, len(self)):
                         for x in self.parentrevs(i):
                             if x != nullrev and x in seen:
                                 seen.add(i)
                                 yield i
                                 break
                 def findcommonmissing(self, common=None, heads=None):
                     """Return a tuple of the ancestors of common and the ancestors of heads
                     that are not ancestors of common.
                     More specifically, the second element is a list of nodes N such that
                     every N satisfies the following constraints:
 . N is an ancestor of some node in 'heads'
 . N is not an ancestor of any node in 'common'
                     The list is sorted by revision number, meaning it is
                     topologically sorted.
                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     if common is None:
                         common = [nullid]
                     if heads is None:
                         heads = self.heads()
                     common = [self.rev(n) for n in common]
                     heads = [self.rev(n) for n in heads]
                     # we want the ancestors, but inclusive
                     has = set(self.ancestors(*common))
                     has.add(nullrev)
                     has.update(common)
                     # take all ancestors from heads that aren't in has
                     missing = set()
                     visit = [r for r in heads if r not in has]
                     while visit:
                         r = visit.pop(0)
                         if r in missing:
                             continue
                         else:
                             missing.add(r)
                             for p in self.parentrevs(r):
                                 if p not in has:
                                     visit.append(p)
                     missing = list(missing)
                     missing.sort()
                     return has, [self.node(r) for r in missing]
                 def findmissing(self, common=None, heads=None):
                     """Return the ancestors of heads that are not ancestors of common.
                     More specifically, return a list of nodes N such that every N
                     satisfies the following constraints:
 . N is an ancestor of some node in 'heads'
 . N is not an ancestor of any node in 'common'
                     The list is sorted by revision number, meaning it is
                     topologically sorted.
                     'heads' and 'common' are both lists of node IDs.  If heads is
                     not supplied, uses all of the revlog's heads.  If common is not
                     supplied, uses nullid."""
                     _common, missing = self.findcommonmissing(common, heads)
                     return missing
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a topological path from 'roots' to 'heads'.
                     Return a tuple (nodes, outroots, outheads) where 'nodes' is a
                     topologically sorted list of all nodes N that satisfy both of
                     these constraints:
 . N is a descendant of some node in 'roots'
 . N is an ancestor of some node in 'heads'
                     Every node is considered to be both a descendant and an ancestor
                     of itself, so every reachable node in 'roots' and 'heads' will be
                     included in 'nodes'.
                     'outroots' is the list of reachable nodes in 'roots', i.e., the
                     subset of 'roots' that is returned in 'nodes'.  Likewise,
                     'outheads' is the subset of 'heads' that is also in 'nodes'.
                     'roots' and 'heads' are both lists of node IDs.  If 'roots' is
                     unspecified, uses nullid as the only root.  If 'heads' is
                     unspecified, uses list of all of the revlog's heads."""
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [nullid] # Everybody's a descendent of nullid
                         lowestrev = nullrev
                     if (lowestrev == nullrev) and (heads is None):
                         # We want _all_ the nodes!
                         return ([self.node(r) for r in self], [nullid], list(self.heads()))
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = len(self) - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = set()
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
-                        heads = dict.fromkeys(heads, 0)
+                        heads = dict.fromkeys(heads, False)
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = set(heads)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendent of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors.add(n) # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.update([p for p in self.parents(n) if
                                                        p != nullid])
                                 elif n in heads: # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > nullrev:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [n for n in roots if n in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(n) for n in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = nullrev
                             roots = [nullid]
                     # Transform our roots list into a set.
                     descendents = set(roots)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendents.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descedents, empty parents will look like
                     # they're descendents.
                     for r in xrange(max(lowestrev, 0), highestrev + 1):
                         n = self.node(r)
                         isdescendent = False
                         if lowestrev == nullrev:  # Everybody is a descendent of nullid
                             isdescendent = True
                         elif n in descendents:
                             # n is already a descendent
                             isdescendent = True
                             # This check only needs to be done here because all the roots
                             # will start being marked is descendents before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendents, it's not a root.
                                 if (p[0] in descendents) or (p[1] in descendents):
                                     roots.remove(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendent if either of its parents are
                             # descendents.  (We seeded the dependents list with the roots
                             # up there, remember?)
                             if (p[0] in descendents) or (p[1] in descendents):
                                 descendents.add(n)
                                 isdescendent = True
                         if isdescendent and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendents and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
-                                heads[n] = 1
+                                heads[n] = True
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
-                                heads[n] = 1
+                                heads[n] = True
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
-                    heads = [n for n in heads.iterkeys() if heads[n] != 0]
+                    heads = [n for n, flag in heads.iteritems() if flag]
                     roots = list(roots)
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def headrevs(self):
                     count = len(self)
                     if not count:
                         return [nullrev]
                     ishead = [1] * (count + 1)
                     index = self.index
                     for r in xrange(count):
                         e = index[r]
                         ishead[e[5]] = ishead[e[6]] = 0
                     return [r for r in xrange(count) if ishead[r]]
                 def heads(self, start=None, stop=None):
                     """return the list of all nodes that have no children
                     if start is specified, only heads that are descendants of
                     start will be returned
                     if stop is specified, it will consider all the revs from stop
                     as if they had no children
                     """
                     if start is None and stop is None:
                         if not len(self):
                             return [nullid]
                         return [self.node(r) for r in self.headrevs()]
                     if start is None:
                         start = nullid
                     if stop is None:
                         stop = []
                     stoprevs = set([self.rev(n) for n in stop])
                     startrev = self.rev(start)
                     reachable = set((startrev,))
                     heads = set((startrev,))
                     parentrevs = self.parentrevs
                     for r in xrange(startrev + 1, len(self)):
                         for p in parentrevs(r):
                             if p in reachable:
                                 if r not in stoprevs:
                                     reachable.add(r)
                                 heads.add(r)
                             if p in heads and p not in stoprevs:
                                 heads.remove(p)
                     return [self.node(r) for r in heads]
                 def children(self, node):
                     """find the children of a given node"""
                     c = []
                     p = self.rev(node)
                     for r in range(p + 1, len(self)):
                         prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
                         if prevs:
                             for pr in prevs:
                                 if pr == p:
                                     c.append(self.node(r))
                         elif p == nullrev:
                             c.append(self.node(r))
                     return c
                 def descendant(self, start, end):
                     if start == nullrev:
                         return True
                     for i in self.descendants(start):
                         if i == end:
                             return True
                         elif i > end:
                             break
                     return False
                 def ancestor(self, a, b):
                     """calculate the least common ancestor of nodes a and b"""
                     # fast path, check if it is a descendant
                     a, b = self.rev(a), self.rev(b)
                     start, end = sorted((a, b))
                     if self.descendant(start, end):
                         return self.node(start)
                     def parents(rev):
                         return [p for p in self.parentrevs(rev) if p != nullrev]
                     c = ancestor.ancestor(a, b, parents)
                     if c is None:
                         return nullid
                     return self.node(c)
                 def _match(self, id):
                     if isinstance(id, (long, int)):
                         # rev
                         return self.node(id)
                     if len(id) == 20:
                         # possibly a binary node
                         # odds of a binary node being all hex in ASCII are 1 in 10**25
                         try:
                             node = id
                             self.rev(node) # quick search the index
                             return node
                         except LookupError:
                             pass # may be partial hex id
                     try:
                         # str(rev)
                         rev = int(id)
                         if str(rev) != id:
                             raise ValueError
                         if rev < 0:
                             rev = len(self) + rev
                         if rev < 0 or rev >= len(self):
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         pass
                     if len(id) == 40:
                         try:
                             # a full hex nodeid?
                             node = bin(id)
                             self.rev(node)
                             return node
                         except (TypeError, LookupError):
                             pass
                 def _partialmatch(self, id):
                     if id in self._pcache:
                         return self._pcache[id]
                     if len(id) < 40:
                         try:
                             # hex(node)[:...]
                             l = len(id) // 2  # grab an even number of digits
                             prefix = bin(id[:l * 2])
                             nl = [e[7] for e in self.index if e[7].startswith(prefix)]
                             nl = [n for n in nl if hex(n).startswith(id)]
                             if len(nl) > 0:
                                 if len(nl) == 1:
                                     self._pcache[id] = nl[0]
                                     return nl[0]
                                 raise LookupError(id, self.indexfile,
                                                   _('ambiguous identifier'))
                             return None
                         except TypeError:
                             pass
                 def lookup(self, id):
                     """locate a node based on:
                         - revision number or str(revision number)
                         - nodeid or subset of hex nodeid
                     """
                     n = self._match(id)
                     if n is not None:
                         return n
                     n = self._partialmatch(id)
                     if n:
                         return n
                     raise LookupError(id, self.indexfile, _('no match found'))
                 def cmp(self, node, text):
                     """compare text with a given file revision
                     returns True if text is different than what is stored.
                     """
                     p1, p2 = self.parents(node)
                     return hash(text, p1, p2) != node
                 def _addchunk(self, offset, data):
                     o, d = self._chunkcache
                     # try to add to existing cache
                     if o + len(d) == offset and len(d) + len(data) < _chunksize:
                         self._chunkcache = o, d + data
                     else:
                         self._chunkcache = offset, data
                 def _loadchunk(self, offset, length):
                     if self._inline:
                         df = self.opener(self.indexfile)
                     else:
                         df = self.opener(self.datafile)
                     readahead = max(65536, length)
                     df.seek(offset)
                     d = df.read(readahead)
                     self._addchunk(offset, d)
                     if readahead > length:
                         return d[:length]
                     return d
                 def _getchunk(self, offset, length):
                     o, d = self._chunkcache
                     l = len(d)
                     # is it in the cache?
                     cachestart = offset - o
                     cacheend = cachestart + length
                     if cachestart >= 0 and cacheend <= l:
                         if cachestart == 0 and cacheend == l:
                             return d # avoid a copy
                         return d[cachestart:cacheend]
                     return self._loadchunk(offset, length)
                 def _chunkraw(self, startrev, endrev):
                     start = self.start(startrev)
                     length = self.end(endrev) - start
                     if self._inline:
                         start += (startrev + 1) * self._io.size
                     return self._getchunk(start, length)
                 def _chunk(self, rev):
                     return decompress(self._chunkraw(rev, rev))
                 def _chunkbase(self, rev):
                     return self._chunk(rev)
                 def _chunkclear(self):
                     self._chunkcache = (0, '')
                 def deltaparent(self, rev):
                     """return deltaparent of the given revision"""
                     if self.index[rev][3] == rev:
                         return nullrev
                     else:
                         return rev - 1
                 def revdiff(self, rev1, rev2):
                     """return or calculate a delta between two revisions"""
                     if rev1 != nullrev and self.deltaparent(rev2) == rev1:
                         return self._chunk(rev2)
                     return mdiff.textdiff(self.revision(self.node(rev1)),
                                           self.revision(self.node(rev2)))
                 def revision(self, node):
                     """return an uncompressed revision of a given node"""
                     cachedrev = None
                     if node == nullid:
                         return ""
                     if self._cache:
                         if self._cache[0] == node:
                             return self._cache[2]
                         cachedrev = self._cache[1]
                     # look up what we need to read
                     text = None
                     rev = self.rev(node)
                     base = self.base(rev)
                     # check rev flags
                     if self.flags(rev) & ~REVIDX_KNOWN_FLAGS:
                         raise RevlogError(_('incompatible revision flag %x') %
                                           (self.flags(rev) & ~REVIDX_KNOWN_FLAGS))
                     # build delta chain
                     chain = []
                     iterrev = rev
                     while iterrev != base and iterrev != cachedrev:
                         chain.append(iterrev)
                         iterrev -= 1
                     chain.reverse()
                     base = iterrev
                     if iterrev == cachedrev:
                         # cache hit
                         text = self._cache[2]
                     # drop cache to save memory
                     self._cache = None
                     self._chunkraw(base, rev)
                     if text is None:
                         text = self._chunkbase(base)
                     bins = [self._chunk(r) for r in chain]
                     text = mdiff.patches(text, bins)
                     text = self._checkhash(text, node, rev)
                     self._cache = (node, rev, text)
                     return text
                 def _checkhash(self, text, node, rev):
                     p1, p2 = self.parents(node)
                     if node != hash(text, p1, p2):
                         raise RevlogError(_("integrity check failed on %s:%d")
                                           % (self.indexfile, rev))
                     return text
                 def checkinlinesize(self, tr, fp=None):
                     if not self._inline or (self.start(-2) + self.length(-2)) < _maxinline:
                         return
                     trinfo = tr.find(self.indexfile)
                     if trinfo is None:
                         raise RevlogError(_("%s not found in the transaction")
                                           % self.indexfile)
                     trindex = trinfo[2]
                     dataoff = self.start(trindex)
                     tr.add(self.datafile, dataoff)
                     if fp:
                         fp.flush()
                         fp.close()
                     df = self.opener(self.datafile, 'w')
                     try:
                         for r in self:
                             df.write(self._chunkraw(r, r))
                     finally:
                         df.close()
                     fp = self.opener(self.indexfile, 'w', atomictemp=True)
                     self.version &= ~(REVLOGNGINLINEDATA)
                     self._inline = False
                     for i in self:
                         e = self._io.packentry(self.index[i], self.node, self.version, i)
                         fp.write(e)
                     # if we don't call rename, the temp file will never replace the
                     # real index
                     fp.rename()
                     tr.replace(self.indexfile, trindex * self._io.size)
                     self._chunkclear()
                 def addrevision(self, text, transaction, link, p1, p2, cachedelta=None):
                     """add a revision to the log
                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     cachedelta - an optional precomputed delta
                     """
                     node = hash(text, p1, p2)
                     if node in self.nodemap:
                         return node
                     dfh = None
                     if not self._inline:
                         dfh = self.opener(self.datafile, "a")
                     ifh = self.opener(self.indexfile, "a+")
                     try:
                         return self._addrevision(node, text, transaction, link, p1, p2,
                                                  cachedelta, ifh, dfh)
                     finally:
                         if dfh:
                             dfh.close()
                         ifh.close()
                 def _addrevision(self, node, text, transaction, link, p1, p2,
                                  cachedelta, ifh, dfh):
                     btext = [text]
                     def buildtext():
                         if btext[0] is not None:
                             return btext[0]
                         # flush any pending writes here so we can read it in revision
                         if dfh:
                             dfh.flush()
                         ifh.flush()
                         basetext = self.revision(self.node(cachedelta[0]))
                         btext[0] = mdiff.patch(basetext, cachedelta[1])
                         chk = hash(btext[0], p1, p2)
                         if chk != node:
                             raise RevlogError(_("consistency error in delta"))
                         return btext[0]
                     def builddelta(rev):
                         # can we use the cached delta?
                         if cachedelta and cachedelta[0] == rev:
                             delta = cachedelta[1]
                         else:
                             t = buildtext()
                             ptext = self.revision(self.node(rev))
                             delta = mdiff.textdiff(ptext, t)
                         data = compress(delta)
                         l = len(data[1]) + len(data[0])
                         base = self.base(rev)
                         dist = l + offset - self.start(base)
                         return dist, l, data, base
                     curr = len(self)
                     prev = curr - 1
                     base = curr
                     offset = self.end(prev)
                     flags = 0
                     d = None
                     p1r, p2r = self.rev(p1), self.rev(p2)
                     # should we try to build a delta?
                     if prev != nullrev:
                         d = builddelta(prev)
                         dist, l, data, base = d
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     if text is None:
                         textlen = mdiff.patchedsize(self.rawsize(cachedelta[0]),
                                                     cachedelta[1])
                     else:
                         textlen = len(text)
                     if d is None or dist > textlen * 2:
                         text = buildtext()
                         data = compress(text)
                         l = len(data[1]) + len(data[0])
                         base = curr
                     e = (offset_type(offset, flags), l, textlen,
                          base, link, p1r, p2r, node)
                     self.index.insert(-1, e)
                     self.nodemap[node] = curr
                     entry = self._io.packentry(e, self.node, self.version, curr)
                     if not self._inline:
                         transaction.add(self.datafile, offset)
                         transaction.add(self.indexfile, curr * len(entry))
                         if data[0]:
                             dfh.write(data[0])
                         dfh.write(data[1])
                         dfh.flush()
                         ifh.write(entry)
                     else:
                         offset += curr * self._io.size
                         transaction.add(self.indexfile, offset, curr)
                         ifh.write(entry)
                         ifh.write(data[0])
                         ifh.write(data[1])
                         self.checkinlinesize(transaction, ifh)
                     if type(text) == str: # only accept immutable objects
                         self._cache = (node, curr, text)
                     return node
                 def group(self, nodelist, bundler):
                     """Calculate a delta group, yielding a sequence of changegroup chunks
                     (strings).
                     Given a list of changeset revs, return a set of deltas and
                     metadata corresponding to nodes. The first delta is
                     first parent(nodelist[0]) -> nodelist[0], the receiver is
                     guaranteed to have this parent as it has all history before
                     these changesets. In the case firstparent is nullrev the
                     changegroup starts with a full revision.
                     """
                     revs = sorted([self.rev(n) for n in nodelist])
                     # if we don't have any revisions touched by these changesets, bail
                     if not revs:
                         yield bundler.close()
                         return
                     # add the parent of the first rev
                     p = self.parentrevs(revs[0])[0]
                     revs.insert(0, p)
                     # build deltas
                     for r in xrange(len(revs) - 1):
                         prev, curr = revs[r], revs[r + 1]
                         for c in bundler.revchunk(self, curr, prev):
                             yield c
                     yield bundler.close()
                 def addgroup(self, bundle, linkmapper, transaction):
                     """
                     add a delta group
                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.
                     """
                     # track the base of the current delta log
                     node = None
                     r = len(self)
                     end = 0
                     if r:
                         end = self.end(r - 1)
                     ifh = self.opener(self.indexfile, "a+")
                     isize = r * self._io.size
                     if self._inline:
                         transaction.add(self.indexfile, end + isize, r)
                         dfh = None
                     else:
                         transaction.add(self.indexfile, isize, r)
                         transaction.add(self.datafile, end)
                         dfh = self.opener(self.datafile, "a")
                     try:
                         # loop through our set of deltas
                         chain = None
                         while 1:
                             chunkdata = bundle.deltachunk(chain)
                             if not chunkdata:
                                 break
                             node = chunkdata['node']
                             p1 = chunkdata['p1']
                             p2 = chunkdata['p2']
                             cs = chunkdata['cs']
                             deltabase = chunkdata['deltabase']
                             delta = chunkdata['delta']
                             link = linkmapper(cs)
                             if node in self.nodemap:
                                 # this can happen if two branches make the same change
                                 chain = node
                                 continue
                             for p in (p1, p2):
                                 if not p in self.nodemap:
                                     raise LookupError(p, self.indexfile,
                                                       _('unknown parent'))
                             if deltabase not in self.nodemap:
                                 raise LookupError(deltabase, self.indexfile,
                                                   _('unknown delta base'))
                             baserev = self.rev(deltabase)
                             chain = self._addrevision(node, None, transaction, link,
                                                       p1, p2, (baserev, delta), ifh, dfh)
                             if not dfh and not self._inline:
                                 # addrevision switched from inline to conventional
                                 # reopen the index
                                 ifh.close()
                                 dfh = self.opener(self.datafile, "a")
                                 ifh = self.opener(self.indexfile, "a")
                     finally:
                         if dfh:
                             dfh.close()
                         ifh.close()
                     return node
                 def strip(self, minlink, transaction):
                     """truncate the revlog on the first revision with a linkrev >= minlink
                     This function is called when we're stripping revision minlink and
                     its descendants from the repository.
                     We have to remove all revisions with linkrev >= minlink, because
                     the equivalent changelog revisions will be renumbered after the
                     strip.
                     So we truncate the revlog on the first of these revisions, and
                     trust that the caller has saved the revisions that shouldn't be
                     removed and that it'll readd them after this truncation.
                     """
                     if len(self) == 0:
                         return
                     for rev in self:
                         if self.index[rev][4] >= minlink:
                             break
                     else:
                         return
                     # first truncate the files on disk
                     end = self.start(rev)
                     if not self._inline:
                         transaction.add(self.datafile, end)
                         end = rev * self._io.size
                     else:
                         end += rev * self._io.size
                     transaction.add(self.indexfile, end)
                     # then reset internal state in memory to forget those revisions
                     self._cache = None
                     self._chunkclear()
                     for x in xrange(rev, len(self)):
                         del self.nodemap[self.node(x)]
                     del self.index[rev:-1]
                 def checksize(self):
                     expected = 0
                     if len(self):
                         expected = max(0, self.end(len(self) - 1))
                     try:
                         f = self.opener(self.datafile)
                         f.seek(0, 2)
                         actual = f.tell()
                         f.close()
                         dd = actual - expected
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         dd = 0
                     try:
                         f = self.opener(self.indexfile)
                         f.seek(0, 2)
                         actual = f.tell()
                         f.close()
                         s = self._io.size
                         i = max(0, actual // s)
                         di = actual - (i * s)
                         if self._inline:
                             databytes = 0
                             for r in self:
                                 databytes += max(0, self.length(r))
                             dd = 0
                             di = actual - len(self) * s - databytes
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         di = 0
                     return (dd, di)
                 def files(self):
                     res = [self.indexfile]
                     if not self._inline:
                         res.append(self.datafile)
                     return res