upstream/mercurial-mirror Commit - r2138:f5046cab

1

"""

1

"""

2

revlog.py - storage back-end for mercurial

2

revlog.py - storage back-end for mercurial

3

4

This provides efficient delta storage with O(1) retrieve and append

4

This provides efficient delta storage with O(1) retrieve and append

5

and O(changes) merge between branches

5

and O(changes) merge between branches

6

7

8

9

This software may be used and distributed according to the terms

9

This software may be used and distributed according to the terms

10

of the GNU General Public License, incorporated herein by reference.

10

of the GNU General Public License, incorporated herein by reference.

11

"""

11

"""

12

13

from node import *

13

from node import *

14

from i18n import gettext as _

14

from i18n import gettext as _

15

from demandload import demandload

15

from demandload import demandload

16

demandload(globals(), "binascii changegroup errno heapq mdiff os")

16

demandload(globals(), "binascii changegroup errno heapq mdiff os")

17

demandload(globals(), "sha struct zlib")

17

demandload(globals(), "sha struct zlib")

18

19

# revlog version strings

19

# revlog version strings

20

REVLOGV0 = 0

20

REVLOGV0 = 0

21

REVLOGNG = 1

21

REVLOGNG = 1

22

23

# revlog flags

23

# revlog flags

24

REVLOGNGINLINEDATA = (1 << 16)

24

REVLOGNGINLINEDATA = (1 << 16)

25

26

def flagstr(flag):
    """Translate a symbolic revlog flag name into its bit value.

    Only "inline" is recognised; it maps to REVLOGNGINLINEDATA.

    Raises RevlogError for any other name.
    """
    if flag == "inline":
        return REVLOGNGINLINEDATA
    # Interpolate after the gettext lookup: formatting first would hand
    # gettext an already-expanded string that can never match a catalog
    # entry, so the message would never be translated.
    raise RevlogError(_("unknown revlog flag %s") % flag)

30

31

def hash(text, p1, p2):
    """Compute the digest identifying a revision.

    The digest is taken over the smaller parent hash, then the larger
    parent hash, then the revision text, so the result does not depend
    on which parent is passed as p1 and which as p2.  Mixing the
    parents in means identical content with different history gets a
    different node.
    """
    digest = sha.new(min(p1, p2))
    digest.update(max(p1, p2))
    digest.update(text)
    return digest.digest()

44

45

def compress(text):
    """Return a (header, data) pair holding a storable form of text.

    Texts of 44 bytes or more are zlib-compressed and returned with an
    empty header, provided that does not make them longer.  Everything
    else is stored literally: with a 'u' header, or with an empty
    header when the text is empty or already starts with a NUL byte
    (decompress() passes such data through untouched).
    """
    if not text:
        return ("", text)
    if len(text) >= 44:
        packed = zlib.compress(text)
        if len(packed) <= len(text):
            return ("", packed)
    # literal storage: either too short to bother or compression lost
    if text[0] == '\0':
        return ("", text)
    return ('u', text)

56

57

def decompress(bin):
    """Recover the original text from a stored chunk.

    The first byte selects the encoding: 'x' means the whole chunk is
    a zlib stream, 'u' means the rest of the chunk is literal text,
    and a NUL byte means the chunk itself is the literal text.  Empty
    input is returned unchanged.

    Raises RevlogError for any other leading byte.
    """
    if not bin:
        return bin
    marker = bin[0]
    if marker == 'x':
        return zlib.decompress(bin)
    if marker == 'u':
        return bin[1:]
    if marker == '\0':
        return bin
    raise RevlogError(_("unknown compression type %r") % marker)

65

66

indexformatv0 = ">4l20s20s20s"

66

indexformatv0 = ">4l20s20s20s"

67

v0shaoffset = 56

67

v0shaoffset = 56

68

# index ng:

68

# index ng:

69

# 6 bytes offset

69

# 6 bytes offset

70

# 2 bytes flags

70

# 2 bytes flags

71

# 4 bytes compressed length

71

# 4 bytes compressed length

72

# 4 bytes uncompressed length

72

# 4 bytes uncompressed length

73

# 4 bytes: base rev

73

# 4 bytes: base rev

74

# 4 bytes link rev

74

# 4 bytes link rev

75

# 4 bytes parent 1 rev

75

# 4 bytes parent 1 rev

76

# 4 bytes parent 2 rev

76

# 4 bytes parent 2 rev

77

# 32 bytes: nodeid

77

# 32 bytes: nodeid

78

indexformatng = ">Qiiiiii20s12x"

78

indexformatng = ">Qiiiiii20s12x"

79

ngshaoffset = 32

79

ngshaoffset = 32

80

versionformat = ">i"

80

versionformat = ">i"

81

82

class lazyparser(object):
    """
    this class avoids the need to parse the entirety of large indices

    Index records are read from the file on demand and kept, still
    packed, in self.index (None marks a record not read yet).
    self.map maps each nodeid seen so far to its record number.
    """
    def __init__(self, dataf, size, indexformat, shaoffset):
        """Set up an empty cache over an index file.

        dataf is a file object supporting seek() and read(), size is
        the number of bytes of index data, indexformat is the struct
        format of one record and shaoffset is the byte offset of the
        20-byte nodeid within a record.
        """
        self.dataf = dataf
        self.format = indexformat
        # size in bytes of one packed record
        self.s = struct.calcsize(indexformat)
        self.indexformat = indexformat
        self.datasize = size
        # number of whole records in the file
        self.l = size // self.s
        self.index = [None] * self.l
        self.map = {nullid: -1}
        # set once loadmap() has filled self.map for every record
        self.allmap = 0
        # set once every record has been read into self.index
        self.all = 0
        # number of file searches findnode() has performed so far
        self.mapfind_count = 0
        self.shaoffset = shaoffset

    def loadmap(self):
        """
        during a commit, we need to make sure the rev being added is
        not a duplicate.  This requires loading the entire index,
        which is fairly slow.  loadmap can load up just the node map,
        which takes much less time.
        """
        if self.allmap:
            return
        end = self.datasize
        self.allmap = 1
        cur = 0
        count = 0
        # read 256 records at a time
        blocksize = self.s * 256
        self.dataf.seek(0)
        while cur < end:
            data = self.dataf.read(blocksize)
            off = 0
            for x in xrange(256):
                n = data[off + self.shaoffset:off + self.shaoffset + 20]
                self.map[n] = count
                count += 1
                if count >= self.l:
                    break
                off += self.s
            cur += blocksize

    def loadblock(self, blockstart, blocksize, data=None):
        """Cache the records found in one stretch of the index file.

        blockstart and blocksize are in bytes.  If data is not given
        it is read from the file.  Records already present in
        self.index are left alone; new ones are stored packed and
        their nodeids added to self.map.
        """
        if self.all:
            return
        if data is None:
            self.dataf.seek(blockstart)
            data = self.dataf.read(blocksize)
        lend = len(data) // self.s
        i = blockstart // self.s
        off = 0
        for x in xrange(lend):
            if self.index[i + x] is None:
                b = data[off : off + self.s]
                self.index[i + x] = b
                n = b[self.shaoffset:self.shaoffset + 20]
                self.map[n] = i + x
            off += self.s

    def findnode(self, node):
        """search backwards through the index file for a specific node

        Returns node, after recording its record number in self.map,
        when it is found; returns None otherwise.
        """
        if self.allmap:
            return None

        # hg log will cause many many searches for the manifest
        # nodes.  After we get called a few times, just load the whole
        # thing.
        if self.mapfind_count > 8:
            self.loadmap()
            if node in self.map:
                return node
            return None
        self.mapfind_count += 1
        # skip the records at the tail that are already cached
        last = self.l - 1
        while self.index[last] is not None:
            if last == 0:
                # every record is cached, nothing left to search
                self.all = 1
                self.allmap = 1
                return None
            last -= 1
        end = (last + 1) * self.s
        blocksize = self.s * 256
        while end >= 0:
            start = max(end - blocksize, 0)
            self.dataf.seek(start)
            data = self.dataf.read(end - start)
            findend = end - start
            while True:
                # we're searching backwards, so we have to make sure
                # we don't find a changeset where this node is a parent
                off = data.rfind(node, 0, findend)
                findend = off
                if off >= 0:
                    # round down to the start of the containing record
                    # and compare against that record's own nodeid
                    i = off // self.s
                    off = i * self.s
                    n = data[off + self.shaoffset:off + self.shaoffset + 20]
                    if n == node:
                        self.map[n] = i + start // self.s
                        return node
                else:
                    break
            end -= blocksize
        return None

    def loadindex(self, i=None, end=None):
        """Read index records into the cache.

        With no arguments every record is loaded.  With i and a true
        end, records i up to (not including) end are loaded in one
        read.  With only i, a window of 64 records containing i is
        loaded.
        """
        if self.all:
            return
        loadall = False
        if i is None:
            blockstart = 0
            # largest multiple of the record size that fits in 512 bytes
            blocksize = (512 // self.s) * self.s
            end = self.datasize
            loadall = True
        else:
            if end:
                blockstart = i * self.s
                end = end * self.s
                blocksize = end - blockstart
            else:
                # NOTE(review): the mask only clears bit 5, so the
                # window starts at i or i - 32 rather than on a
                # 64-record boundary; it always contains i either way
                blockstart = (i & ~(32)) * self.s
                blocksize = self.s * 64
                end = blockstart + blocksize
        while blockstart < end:
            self.loadblock(blockstart, blocksize)
            blockstart += blocksize
        if loadall:
            self.all = True

208

209

class lazyindex(object):
    """List-like view of the index that reads records only when asked.

    All storage lives in the parser's index list; this wrapper asks
    the parser to load missing records and unpacks packed ones.
    """
    def __init__(self, parser):
        self.p = parser

    def __len__(self):
        return len(self.p.index)

    def load(self, pos):
        """Have the parser read the record at pos and return it."""
        if pos < 0:
            # turn a from-the-end position into an absolute one
            pos = pos + len(self.p.index)
        self.p.loadindex(pos)
        return self.p.index[pos]

    def __getitem__(self, pos):
        entry = self.p.index[pos]
        if not entry:
            entry = self.load(pos)
        if isinstance(entry, str):
            # still in packed form; unpack it for the caller
            return struct.unpack(self.p.indexformat, entry)
        return entry

    def __setitem__(self, pos, item):
        self.p.index[pos] = item

    def __delitem__(self, pos):
        del self.p.index[pos]

    def append(self, e):
        self.p.index.append(e)

231

232

class lazymap(object):
    """a lazy version of the node map

    Lookups are answered from the parser's map when possible; on a
    miss the parser is asked to search or load the index file.
    """
    def __init__(self, parser):
        self.p = parser

    def load(self, key):
        """Ask the parser to locate key; raise KeyError if it cannot."""
        n = self.p.findnode(key)
        if n is None:
            raise KeyError(key)

    def __contains__(self, key):
        if key in self.p.map:
            return True
        # not seen yet: load the complete node map and look again
        self.p.loadmap()
        return key in self.p.map

    def __iter__(self):
        """Yield nullid, then the nodeid of every record in order."""
        yield nullid
        for i in xrange(self.p.l):
            ret = self.p.index[i]
            if not ret:
                self.p.loadindex(i)
                ret = self.p.index[i]
            if isinstance(ret, str):
                ret = struct.unpack(self.p.indexformat, ret)
            # the nodeid is the last field of a record
            yield ret[-1]

    def __getitem__(self, key):
        try:
            return self.p.map[key]
        except KeyError:
            try:
                self.load(key)
                return self.p.map[key]
            except KeyError:
                raise KeyError("node " + hex(key))

    def __setitem__(self, key, val):
        self.p.map[key] = val

    def __delitem__(self, key):
        del self.p.map[key]

268

269

class RevlogError(Exception):
    """Raised by this module for invalid revlog data or requests."""

270

271

class revlog(object):

271

class revlog(object):

272

"""

272

"""

273

the underlying revision storage object

273

the underlying revision storage object

274

275

A revlog consists of two parts, an index and the revision data.

275

A revlog consists of two parts, an index and the revision data.

276

277

The index is a file with a fixed record size containing

277

The index is a file with a fixed record size containing

278

information on each revision, including its nodeid (hash), the

278

information on each revision, including its nodeid (hash), the

279

nodeids of its parents, the position and offset of its data within

279

nodeids of its parents, the position and offset of its data within

280

the data file, and the revision it's based on. Finally, each entry

280

the data file, and the revision it's based on. Finally, each entry

281

contains a linkrev entry that can serve as a pointer to external

281

contains a linkrev entry that can serve as a pointer to external

282

data.

282

data.

283

284

The revision data itself is a linear collection of data chunks.

284

The revision data itself is a linear collection of data chunks.

285

Each chunk represents a revision and is usually represented as a

285

Each chunk represents a revision and is usually represented as a

286

delta against the previous chunk. To bound lookup time, runs of

286

delta against the previous chunk. To bound lookup time, runs of

287

deltas are limited to about 2 times the length of the original

287

deltas are limited to about 2 times the length of the original

288

version data. This makes retrieval of a version proportional to

288

version data. This makes retrieval of a version proportional to

289

its size, or O(1) relative to the number of revisions.

289

its size, or O(1) relative to the number of revisions.

290

291

Both pieces of the revlog are written to in an append-only

291

Both pieces of the revlog are written to in an append-only

292

fashion, which means we never need to rewrite a file to insert or

292

fashion, which means we never need to rewrite a file to insert or

293

remove data, and can use some simple techniques to avoid the need

293

remove data, and can use some simple techniques to avoid the need

294

for locking while reading.

294

for locking while reading.

295

"""

295

"""

296

def __init__(self, opener, indexfile, datafile, defversion=0):
    """
    Set up a revlog over the given index and data files.

    opener is the callable used to open both files; routing all file
    access through it lets callers implement COW semantics or the
    like.  defversion is the version assumed when the index file
    supplies none.  The index is loaded straight away.
    """
    self.opener = opener
    self.indexfile = indexfile
    self.datafile = datafile
    self.defversion = defversion

    # nothing has been read or cached yet
    self.indexstat = self.cache = self.chunkcache = None

    self.load()

312

313

def load(self):

313

def load(self):

314

v = self.defversion

314

v = self.defversion

315

try:

315

try:

316

f = self.opener(self.indexfile)

316

f = self.opener(self.indexfile)

317

i = f.read(4)

317

i = f.read(4)

318

f.seek(0)

318

f.seek(0)

319

except IOError, inst:

319

except IOError, inst:

320

if inst.errno != errno.ENOENT:

320

if inst.errno != errno.ENOENT:

321

raise

321

raise

322

i = ""

322

i = ""

323

else:

323

else:

324

try:

324

try:

325

st = os.fstat(f.fileno())

325

st = os.fstat(f.fileno())

326

except AttributeError, inst:

326

except AttributeError, inst:

327

st = None

327

st = None

328

else:

328

else:

329

oldst = self.indexstat

329

oldst = self.indexstat

330

if (oldst and st.st_dev == oldst.st_dev

330

if (oldst and st.st_dev == oldst.st_dev

331

and st.st_ino == oldst.st_ino

331

and st.st_ino == oldst.st_ino

332

and st.st_mtime == oldst.st_mtime

332

and st.st_mtime == oldst.st_mtime

333

and st.st_ctime == oldst.st_ctime):

333

and st.st_ctime == oldst.st_ctime):

334

return

334

return

335

self.indexstat = st

335

self.indexstat = st

336

if len(i) > 0:

336

if len(i) > 0:

337

v = struct.unpack(versionformat, i)[0]

337

v = struct.unpack(versionformat, i)[0]

338

flags = v & ~0xFFFF

338

flags = v & ~0xFFFF

339

fmt = v & 0xFFFF

339

fmt = v & 0xFFFF

340

if fmt == 0:

340

if fmt == 0:

341

if flags:

341

if flags:

342

raise RevlogError(_("index %s invalid flags %x for format v0" %

342

raise RevlogError(_("index %s invalid flags %x for format v0" %

343

(self.indexfile, flags)))

343

(self.indexfile, flags)))

344

elif fmt == REVLOGNG:

344

elif fmt == REVLOGNG:

345

if flags & ~REVLOGNGINLINEDATA:

345

if flags & ~REVLOGNGINLINEDATA:

346

raise RevlogError(_("index %s invalid flags %x for revlogng" %

346

raise RevlogError(_("index %s invalid flags %x for revlogng" %

347

(self.indexfile, flags)))

347

(self.indexfile, flags)))

348

else:

348

else:

349

raise RevlogError(_("index %s invalid format %d" %

349

raise RevlogError(_("index %s invalid format %d" %

350

(self.indexfile, fmt)))

350

(self.indexfile, fmt)))

351

self.version = v

351

self.version = v

352

if v == 0:

352

if v == 0:

353

self.indexformat = indexformatv0

353

self.indexformat = indexformatv0

354

shaoffset = v0shaoffset

354

shaoffset = v0shaoffset

355

else:

355

else:

356

self.indexformat = indexformatng

356

self.indexformat = indexformatng

357

shaoffset = ngshaoffset

357

shaoffset = ngshaoffset

358

359

if i:

359

if i:

360

if not self.inlinedata() and st and st.st_size > 10000:

360

if not self.inlinedata() and st and st.st_size > 10000:

361

# big index, let's parse it on demand

361

# big index, let's parse it on demand

362

parser = lazyparser(f, st.st_size, self.indexformat, shaoffset)

362

parser = lazyparser(f, st.st_size, self.indexformat, shaoffset)

363

self.index = lazyindex(parser)

363

self.index = lazyindex(parser)

364

self.nodemap = lazymap(parser)

364

self.nodemap = lazymap(parser)

365

else:

365

else:

366

i = f.read()

366

i = f.read()

367

self.parseindex(i)

367

self.parseindex(i)

368

if self.inlinedata():

368

if self.inlinedata():

369

# we've already got the entire data file read in, save it

369

# we've already got the entire data file read in, save it

370

# in the chunk data

370

# in the chunk data

371

self.chunkcache = (0, i)

371

self.chunkcache = (0, i)

372

if self.version != 0:

372

if self.version != 0:

373

e = list(self.index[0])

373

e = list(self.index[0])

374

type = self.ngtype(e[0])

374

type = self.ngtype(e[0])

375

e[0] = self.offset_type(0, type)

375

e[0] = self.offset_type(0, type)

376

self.index[0] = e

376

self.index[0] = e

377

else:

377

else:

378

self.nodemap = { nullid: -1}

378

self.nodemap = { nullid: -1}

379

self.index = []

379

self.index = []

380

381

382

def parseindex(self, data):
    """Unpack every index record in data.

    Replaces self.index with the list of unpacked records and
    self.nodemap with a mapping from each record's last field (its
    nodeid) to its position, plus nullid mapped to -1.
    """
    recsize = struct.calcsize(self.indexformat)
    total = len(data)
    index = self.index = []
    nodemap = self.nodemap = {nullid: -1}
    inline = self.inlinedata()
    pos = 0
    while pos < total:
        entry = struct.unpack(self.indexformat, data[pos:pos + recsize])
        nodemap[entry[-1]] = len(index)
        index.append(entry)
        pos += recsize
        if inline:
            # with inline data, entry[1] further bytes sit between this
            # record and the next one; step over them
            pos += entry[1]

398

399

def ngoffset(self, q):
    """Return the offset held in the upper bits of a packed ng field.

    q combines an offset (bits 16 and up) with 16 flag bits.

    Raises RevlogError when any of the flag bits is set.
    """
    flags = q & 0xFFFF
    if flags:
        # report the offending flag bits; the builtin `type` used here
        # before cannot be formatted with %x
        raise RevlogError(_('%s: incompatible revision flag %x') %
                          (self.indexfile, flags))
    return long(q >> 16)

404

405

def ngtype(self, q):
    """Return the low 16 bits of a packed ng offset field as an int."""
    low_bits = q & 0xFFFF
    return int(low_bits)

407

408

def offset_type(self, offset, type):

408

def offset_type(self, offset, type):

409

return long(long(offset) << 16 | type)

409

return long(long(offset) << 16 | type)

410

411

def loadindex(self, start, end):
    """Have the lazy parser read index records start..end in one go.

    Does nothing when the index is not lazy.
    """
    index = self.index
    if not isinstance(index, lazyindex):
        return
    index.p.loadindex(start, end)

415

416

def loadindexmap(self):
    """Fully load a lazy index and switch to the parser's plain node map.

    Does nothing when the index is not lazy.
    """
    index = self.index
    if not isinstance(index, lazyindex):
        return
    parser = index.p
    parser.loadindex()
    self.nodemap = parser.map

422

423

def loadmap(self):
    """Fully load a lazy node map and replace it with the plain dict.

    Does nothing when the node map is not lazy.
    """
    nodemap = self.nodemap
    if not isinstance(nodemap, lazymap):
        return
    parser = nodemap.p
    parser.loadmap()
    self.nodemap = parser.map

428

429

def inlinedata(self):
    """Return the inline-data flag bit of the version (zero if unset)."""
    return self.version & REVLOGNGINLINEDATA

430

def tip(self): return self.node(len(self.index) - 1)

430

def tip(self): return self.node(len(self.index) - 1)

431

def count(self): return len(self.index)

431

def count(self): return len(self.index)

432

def node(self, rev):

432

def node(self, rev):

433

return (rev < 0) and nullid or self.index[rev][-1]

433

return (rev < 0) and nullid or self.index[rev][-1]

434

def rev(self, node):

434

def rev(self, node):

435

try:

435

try:

436

return self.nodemap[node]

436

return self.nodemap[node]

437

except KeyError:

437

except KeyError:

438

raise RevlogError(_('%s: no node %s') % (self.indexfile, hex(node)))

438

raise RevlogError(_('%s: no node %s') % (self.indexfile, hex(node)))

439

def linkrev(self, node): return self.index[self.rev(node)][-4]

439

def linkrev(self, node): return self.index[self.rev(node)][-4]

440

def parents(self, node):
    """Return the two parent nodeids of node.

    nullid's parents are (nullid, nullid).  Version 0 entries hold the
    parent values directly and they are returned as stored; otherwise
    the stored parent revision numbers are mapped through node() and
    returned as a list.
    """
    if node == nullid:
        return (nullid, nullid)
    entry = self.index[self.rev(node)]
    # the two fields just before the trailing nodeid
    pair = entry[-3:-1]
    if self.version != 0:
        return [self.node(p) for p in pair]
    return pair

447

def start(self, rev):

447

def start(self, rev):

448

if rev < 0:

448

if rev < 0:

449

return -1

449

return -1

450

if self.version != 0:

450

if self.version != 0:

451

return self.ngoffset(self.index[rev][0])

451

return self.ngoffset(self.index[rev][0])

452

return self.index[rev][0]

452

return self.index[rev][0]

453

454

def end(self, rev): return self.start(rev) + self.length(rev)

454

def end(self, rev): return self.start(rev) + self.length(rev)

455

456

def size(self, rev):

456

def size(self, rev):

457

"""return the length of the uncompressed text for a given revision"""

457

"""return the length of the uncompressed text for a given revision"""

458

l = -1

458

l = -1

459

if self.version != 0:

459

if self.version != 0:

460

l = self.index[rev][2]

460

l = self.index[rev][2]

461

if l >= 0:

461

if l >= 0:

462

return l

462

return l

463

464

t = self.revision(self.node(rev))

464

t = self.revision(self.node(rev))

465

return len(t)

465

return len(t)

466

467

# alternate implementation, The advantage to this code is it

467

# alternate implementation, The advantage to this code is it

468

# will be faster for a single revision. But, the results are not

468

# will be faster for a single revision. But, the results are not

469

# cached, so finding the size of every revision will be slower.

469

# cached, so finding the size of every revision will be slower.

470

"""

470

"""

471

if self.cache and self.cache[1] == rev:

471

if self.cache and self.cache[1] == rev:

472

return len(self.cache[2])

472

return len(self.cache[2])

473

474

base = self.base(rev)

474

base = self.base(rev)

475

if self.cache and self.cache[1] >= base and self.cache[1] < rev:

475

if self.cache and self.cache[1] >= base and self.cache[1] < rev:

476

base = self.cache[1]

476

base = self.cache[1]

477

text = self.cache[2]

477

text = self.cache[2]

478

else:

478

else:

479

text = self.revision(self.node(base))

479

text = self.revision(self.node(base))

480

481

l = len(text)

481

l = len(text)

482

for x in xrange(base + 1, rev + 1):

482

for x in xrange(base + 1, rev + 1):

483

l = mdiff.patchedsize(l, self.chunk(x))

483

l = mdiff.patchedsize(l, self.chunk(x))

484

return l

484

return l

485

"""

485

"""

486

487

def length(self, rev):

487

def length(self, rev):

488

if rev < 0:

488

if rev < 0:

489

return 0

489

return 0

490

else:

490

else:

491

return self.index[rev][1]

491

return self.index[rev][1]

492

def base(self, rev): return (rev < 0) and rev or self.index[rev][-5]

492

def base(self, rev): return (rev < 0) and rev or self.index[rev][-5]

493

494

def reachable(self, rev, stop=None):
    """Return a dict whose keys are the nodes reachable from rev.

    Despite its name, rev is handled as a nodeid: it is passed to
    parents() and compared against nullid.  The walk follows parent
    links breadth first, does not expand stop or nullid, and ignores
    parents whose revision number is lower than that of stop.
    """
    if stop:
        stopn = self.rev(stop)
    else:
        stopn = 0
    seen = {rev: 1}
    pending = [rev]
    while pending:
        current = pending.pop(0)
        if current == stop or current == nullid:
            continue
        for parent in self.parents(current):
            if self.rev(parent) >= stopn and parent not in seen:
                seen[parent] = 1
                pending.append(parent)
    return seen

515

516

def nodesbetween(self, roots=None, heads=None):
    """Return a tuple (nodes, roots, heads).

    nodes is a topologically sorted list of every node that
      1. is descended from a node in roots (a root counts as its own
         descendent), and
      2. is an ancestor of a node in heads (a head counts as its own
         ancestor).
    The returned roots and heads are the requested ones with the
    unreachable entries pruned.

    If roots is unspecified, nullid is assumed as the only root.
    If heads is unspecified, it is taken to be the output of the
    heads method (i.e. a list of all nodes in the repository that
    have no children)."""
    empty = ([], [], [])
    if roots is None:
        # every node descends from nullid
        roots = [nullid]
        lowestrev = -1
    else:
        roots = list(roots)
        if not roots:
            return empty
        lowestrev = min([self.rev(n) for n in roots])
    if (heads is None) and (lowestrev == -1):
        # no constraint at all: hand back every node
        return ([self.node(r) for r in xrange(0, self.count())],
                [nullid], list(self.heads()))
    if heads is None:
        # None marks "every node is an ancestor"; the last revision is
        # then the upper limit of the sweep
        ancestors = None
        highestrev = self.count() - 1
        # real heads are discovered during the sweep below
        heads = {}
    else:
        heads = list(heads)
        if not heads:
            return empty
        ancestors = {}
        # walk down from the requested heads, marking parents
        pending = heads[:]
        # value 0 = not (yet) reached from a root; entries that turn
        # out to be ancestors of another head are removed
        heads = dict.fromkeys(heads, 0)
        # upper limit for the sweep below
        highestrev = max([self.rev(n) for n in pending])
        while pending:
            n = pending.pop()
            if n == nullid:
                # nullid is never marked
                continue
            # revision numbers are topologically ordered, so anything
            # below the lowest root cannot descend from a root
            if self.rev(n) < lowestrev:
                continue
            if n not in ancestors:
                ancestors[n] = 1
                pending.extend([p for p in self.parents(n) if
                                p != nullid])
            elif n in heads:
                # reached a second time: it is an ancestor of another
                # head, hence not a real head
                heads.pop(n)
        if not ancestors:
            return empty
        if lowestrev > -1:
            # drop roots that are not ancestors of any head and
            # recompute the lowest revision from what is left
            roots = [n for n in roots if n in ancestors]
            if not roots:
                return empty
            lowestrev = min([self.rev(n) for n in roots])
        else:
            # descending from nullid: other roots are irrelevant
            lowestrev = -1
            roots = [nullid]
    # dicts used as sets; descendents is seeded with the roots
    descendents = dict.fromkeys(roots, 1)
    # separate copy so roots descended from other roots can be dropped
    roots = descendents.copy()
    orderedout = []
    # start at revision 0 at the earliest: nullid must not be emitted
    for r in xrange(max(lowestrev, 0), highestrev + 1):
        n = self.node(r)
        if lowestrev == -1:
            # everybody descends from nullid
            isdescendent = True
        elif n in descendents:
            # only the seeded roots can already be present here
            isdescendent = True
            if n in roots:
                p = tuple(self.parents(n))
                # a root with a descendent parent is not a real root
                if (p[0] in descendents) or (p[1] in descendents):
                    roots.pop(n)
        else:
            p = tuple(self.parents(n))
            # a node descends from a root if either parent does
            isdescendent = (p[0] in descendents) or (p[1] in descendents)
            if isdescendent:
                descendents[n] = 1
        if not isdescendent:
            continue
        if ancestors is None:
            orderedout.append(n)
            # assume n is a head; a later child removes it again
            heads[n] = 1
            for p in self.parents(n):
                heads.pop(p, None)
        elif n in ancestors:
            orderedout.append(n)
            if n in heads:
                # this requested head is reachable from a root
                heads[n] = 1
    heads = [n for n in heads if heads[n] != 0]
    roots = list(roots)
    assert orderedout
    assert roots
    assert heads
    return (orderedout, roots, heads)

666

667

def heads(self, start=None):
    """return the list of all nodes that have no children

    if start is specified, only heads that are descendants of
    start will be returned (start itself when nothing descends from it)
    """
    if start is None:
        start = nullid
    # both dicts are used as sets: 'descended' collects everything below
    # start, 'tips' loses a node as soon as one of its children shows up
    descended = {start: 1}
    tips = {start: 1}

    for r in xrange(self.rev(start) + 1, self.count()):
        n = self.node(r)
        for pn in self.parents(n):
            if pn not in descended:
                continue
            descended[n] = 1
            tips[n] = 1
            if pn in tips:
                del tips[pn]
    return tips.keys()

689

690

def children(self, node):

690

def children(self, node):

691

"""find the children of a given node"""

691

"""find the children of a given node"""

692

c = []

692

c = []

693

p = self.rev(node)

693

p = self.rev(node)

694

for r in range(p + 1, self.count()):

694

for r in range(p + 1, self.count()):

695

n = self.node(r)

695

n = self.node(r)

696

for pn in self.parents(n):

696

for pn in self.parents(n):

697

if pn == node:

697

if pn == node:

698

c.append(n)

698

c.append(n)

699

continue

699

continue

700

elif pn == nullid:

700

elif pn == nullid:

701

continue

701

continue

702

return c

702

return c

703

704

def lookup(self, id):
    """locate a node based on revision number or subset of hex nodeid

    id - a string holding either a decimal revision number (negative
         numbers count back from the end) or a prefix of a hex node id

    A string that looks like a number but is not a valid revision is
    retried as a hex prefix.  Raises RevlogError when the prefix matches
    no node or more than one node.
    """
    try:
        rev = int(id)
        # reject spellings such as "+1" or "007" that int() accepts
        if str(rev) != id:
            raise ValueError
        if rev < 0:
            rev = self.count() + rev
        if rev < 0 or rev >= self.count():
            raise ValueError
        return self.node(rev)
    except (ValueError, OverflowError):
        # not a usable revision number: fall through to the prefix search
        pass

    matches = [n for n in self.nodemap if hex(n).startswith(id)]
    if len(matches) > 1:
        raise RevlogError(_("Ambiguous identifier"))
    if len(matches) < 1:
        raise RevlogError(_("No match found"))
    return matches[0]

722

723

def diff(self, a, b):
    """return the delta between texts a and b, as computed by
    mdiff.textdiff"""
    delta = mdiff.textdiff(a, b)
    return delta

726

727

def patches(self, t, pl):
    """return the string t with the list of patches pl applied by
    mdiff.patches"""
    patched = mdiff.patches(t, pl)
    return patched

730

731

def chunk(self, rev, df=None, cachelen=4096):
    """return the decompressed stored chunk of revision rev

    rev - the revision number
    df - optional open file object to read from when the chunk cache has
         to be refilled; when omitted, the index file (inline revlog) or
         the data file is opened for the read and closed again
    cachelen - minimum number of bytes to read when refilling the cache

    The raw bytes are served from self.chunkcache, a (start offset, data)
    pair that is replaced whenever it does not cover the chunk.
    """
    start, length = self.start(rev), self.length(rev)
    inline = self.inlinedata()
    if inline:
        # inline data shares the file with the index entries: skip the
        # rev + 1 entries written ahead of this chunk
        start += (rev + 1) * struct.calcsize(self.indexformat)
    end = start + length

    def loadcache(df):
        # read at least cachelen bytes so following chunks may hit too
        cache_length = max(cachelen, length)
        opened = not df
        if opened:
            if inline:
                df = self.opener(self.indexfile)
            else:
                df = self.opener(self.datafile)
        try:
            df.seek(start)
            self.chunkcache = (start, df.read(cache_length))
        finally:
            # only close what was opened here, never the caller's file
            if opened:
                df.close()

    if not self.chunkcache:
        loadcache(df)

    cache_start = self.chunkcache[0]
    cache_end = cache_start + len(self.chunkcache[1])
    if start >= cache_start and end <= cache_end:
        # it is cached
        offset = start - cache_start
    else:
        # a fresh cache always begins at this chunk
        loadcache(df)
        offset = 0

    return decompress(self.chunkcache[1][offset:offset + length])

765

766

def delta(self, node):
    """return or calculate a delta between a node and the revision
    numbered just before it"""
    rev = self.rev(node)
    prev = rev - 1
    return self.revdiff(prev, rev)

770

771

def revdiff(self, rev1, rev2):
    """return or calculate a delta between two revisions

    The stored chunk of rev2 is returned as is when rev2 directly
    follows rev1 and both share the same base; otherwise both texts are
    rebuilt and diffed.
    """
    samebase = self.base(rev1) == self.base(rev2)
    if samebase and rev1 + 1 == rev2:
        return self.chunk(rev2)
    old = self.revision(self.node(rev1))
    new = self.revision(self.node(rev2))
    return self.diff(old, new)

780

781

def revision(self, node):
    """return the uncompressed text of the revision of a given node

    The text is rebuilt by taking the chunk at the base of the delta
    chain (or a cached text that lies on the chain) and applying the
    later chunks up to the requested revision.  The result is checked
    against the node hash and remembered in self.cache.

    Raises RevlogError when the rebuilt text does not hash to node.
    """
    if node == nullid:
        return ""
    if self.cache and self.cache[0] == node:
        return self.cache[2]

    # look up what we need to read
    rev = self.rev(node)
    base = self.base(rev)

    if self.inlinedata():
        # we probably have the whole chunk cached
        df = None
    else:
        df = self.opener(self.datafile)

    try:
        # do we have useful data cached?
        cache = self.cache
        cached = cache and base <= cache[1] < rev
        if cached:
            # start from the cached text instead of the chain base
            base = cache[1]
            text = cache[2]
        self.loadindex(base, rev + 1)
        if not cached:
            text = self.chunk(base, df=df)

        bins = [self.chunk(r, df=df) for r in xrange(base + 1, rev + 1)]
    finally:
        # the data file was opened here, so it is released here
        if df is not None:
            df.close()

    text = self.patches(text, bins)

    p1, p2 = self.parents(node)
    if node != hash(text, p1, p2):
        raise RevlogError(_("integrity check failed on %s:%d")
                          % (self.datafile, rev))

    self.cache = (node, rev, text)
    return text

819

820

def checkinlinesize(self, tr, fp=None):
    """split an inline revlog into an index file and a data file

    Nothing happens unless the revlog keeps its data inline and the
    index file has reached 131072 bytes (128 KiB).  Otherwise every
    chunk is copied to the data file, the index is rewritten without
    the inline flag and the transaction is updated to match.

    tr - the transaction; it must already know the index file
    fp - optional open index file whose current position is taken as
         the file size; when omitted the index file is opened here

    Raises RevlogError when the index file is not part of tr.
    """
    if not self.inlinedata():
        return
    opened = not fp
    if opened:
        fp = self.opener(self.indexfile, 'r')
        fp.seek(0, 2)
    size = fp.tell()
    if size < 131072:
        # still small enough to stay inline; release our own handle
        if opened:
            fp.close()
        return
    trinfo = tr.find(self.indexfile)
    if trinfo is None:
        if opened:
            fp.close()
        raise RevlogError(_("%s not found in the transaction")
                          % self.indexfile)

    trindex = trinfo[2]
    dataoff = self.start(trindex)

    tr.add(self.datafile, dataoff)
    df = self.opener(self.datafile, 'w')
    calc = struct.calcsize(self.indexformat)
    for r in xrange(self.count()):
        # inline chunk r sits behind r + 1 index entries
        start = self.start(r) + (r + 1) * calc
        length = self.length(r)
        fp.seek(start)
        d = fp.read(length)
        df.write(d)
    fp.close()
    df.close()
    fp = self.opener(self.indexfile, 'w', atomictemp=True)
    self.version &= ~(REVLOGNGINLINEDATA)
    if self.count():
        # the packed version is written in place of the first four
        # bytes of entry 0
        x = self.index[0]
        e = struct.pack(self.indexformat, *x)[4:]
        header = struct.pack(versionformat, self.version)
        fp.write(header)
        fp.write(e)

    for i in xrange(1, self.count()):
        x = self.index[i]
        e = struct.pack(self.indexformat, *x)
        fp.write(e)

    # if we don't call rename, the temp file will never replace the
    # real index
    fp.rename()

    tr.replace(self.indexfile, trindex * calc)
    # offsets changed, so the cached raw data is no longer valid
    self.chunkcache = None

868

869

def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
    """add a revision to the log

    text - the revision data to add
    transaction - the transaction object used for rollback
    link - the linkrev data to add
    p1, p2 - the parent nodeids of the revision
    d - an optional precomputed delta

    p1 defaults to the current tip and p2 to nullid.  Returns the node
    id of the revision; a node that is already known is returned without
    writing anything.
    """
    if text is None:
        text = ""
    if p1 is None:
        p1 = self.tip()
    if p2 is None:
        p2 = nullid

    node = hash(text, p1, p2)

    if node in self.nodemap:
        return node

    n = self.count()
    t = n - 1

    if n:
        base = self.base(t)
        start = self.start(base)
        end = self.end(t)
        if not d:
            prev = self.revision(self.tip())
            d = self.diff(prev, str(text))
        data = compress(d)
        l = len(data[1]) + len(data[0])
        # stored size of the current delta chain plus the new delta
        dist = end - start + l

    # full versions are inserted when the needed deltas
    # become comparable to the uncompressed text
    if not n or dist > len(text) * 2:
        data = compress(text)
        l = len(data[1]) + len(data[0])
        # the new revision starts a chain of its own
        base = n
    # otherwise base still holds self.base(t) from above

    offset = 0
    if t >= 0:
        offset = self.end(t)

    if self.version == 0:
        e = (offset, l, base, link, p1, p2, node)
    else:
        e = (self.offset_type(offset, 0), l, len(text),
             base, link, self.rev(p1), self.rev(p2), node)

    self.index.append(e)
    self.nodemap[node] = n
    entry = struct.pack(self.indexformat, *e)

    if not self.inlinedata():
        transaction.add(self.datafile, offset)
        transaction.add(self.indexfile, n * len(entry))
        f = self.opener(self.datafile, "a")
        if data[0]:
            f.write(data[0])
        f.write(data[1])
        f.close()
        f = self.opener(self.indexfile, "a")
    else:
        f = self.opener(self.indexfile, "a+")
        f.seek(0, 2)
        transaction.add(self.indexfile, f.tell(), self.count() - 1)

    if len(self.index) == 1 and self.version != 0:
        # the very first entry: the packed version is written in place
        # of the first four bytes of the entry
        header = struct.pack(versionformat, self.version)
        f.write(header)
        entry = entry[4:]

    f.write(entry)

    if self.inlinedata():
        f.write(data[0])
        f.write(data[1])
        self.checkinlinesize(transaction, f)

    # NOTE(review): checkinlinesize closes f itself when it splits the
    # revlog; this assumes close() on the opener's file objects may be
    # called twice, as with regular Python files -- confirm
    f.close()

    self.cache = (node, n, text)
    return node

952

953

def ancestor(self, a, b):
    """calculate the least common ancestor of nodes a and b

    Linear history is handled by a reachability check.  Otherwise the
    ancestors of both nodes are walked generation by generation, a
    generation being all ancestors at the same distance from the root,
    starting with the farthest, until the two walks share a node.
    """
    # short cuts for the linear cases
    if a == b:
        return a
    if self.rev(a) < self.rev(b):
        first, last = a, b
    else:
        first, last = b, a

    # reachable won't include stop in the list, so we have to use a parent
    reachable = self.reachable(last, stop=self.parents(first)[0])
    if first in reachable:
        return first

    # distance of every node from the root: one more than its farthest
    # parent
    dist = {nullid: 0}
    for i in xrange(self.count()):
        n = self.node(i)
        p1, p2 = self.parents(n)
        dist[n] = max(dist[p1], dist[p2]) + 1

    def walk(node):
        # yield (distance, node) for node and its ancestors in order of
        # decreasing distance from root; distances are negated because
        # the heap hands back its smallest member
        heap = [(-dist[node], node)]
        seen = {}
        while heap:
            d, n = heapq.heappop(heap)
            if n in seen:
                continue
            seen[n] = 1
            yield (-d, n)
            for p in self.parents(n):
                heapq.heappush(heap, (-dist[p], p))

    def generations(node):
        # group the walk into (distance, {node: 1, ...}) pairs
        curdist, members = None, {}
        for g, n in walk(node):
            if g == curdist:
                members[n] = 1
                continue
            if curdist:
                yield curdist, members
            curdist, members = g, {n: 1}
        yield curdist, members

    x = generations(a)
    y = generations(b)
    gx = x.next()
    gy = y.next()

    # increment each ancestor list until it is closer to root than
    # the other, or they match
    while 1:
        if gx[0] < gy[0]:
            gy = y.next()
        elif gx[0] > gy[0]:
            gx = x.next()
        else:
            # same distance: look for a node present in both
            common = [n for n in gx[1] if n in gy[1]]
            if common:
                return common[0]
            gy = y.next()
            gx = x.next()

1028

1029

def group(self, nodelist, lookup, infocollect=None):

1029

def group(self, nodelist, lookup, infocollect=None):

1030

"""calculate a delta group

1030

"""calculate a delta group

1031

1032

Given a list of changeset revs, return a set of deltas and

1032

Given a list of changeset revs, return a set of deltas and

1033

metadata corresponding to nodes. the first delta is

1033

metadata corresponding to nodes. the first delta is

1034

parent(nodes[0]) -> nodes[0] the receiver is guaranteed to

1034

parent(nodes[0]) -> nodes[0] the receiver is guaranteed to

1035

have this parent as it has all history before these

1035

have this parent as it has all history before these

1036

changesets. parent is parent[0]

1036

changesets. parent is parent[0]

1037

"""

1037

"""

1038

revs = [self.rev(n) for n in nodelist]

1038

revs = [self.rev(n) for n in nodelist]

1039

1040

# if we don't have any revisions touched by these changesets, bail

1040

# if we don't have any revisions touched by these changesets, bail

1041

if not revs:

1041

if not revs:

1042

yield changegroup.closechunk()

1042

yield changegroup.closechunk()

1043

return

1043

return

1044

1045

# add the parent of the first rev

1045

# add the parent of the first rev

1046

p = self.parents(self.node(revs[0]))[0]

1046

p = self.parents(self.node(revs[0]))[0]

1047

revs.insert(0, self.rev(p))

1047

revs.insert(0, self.rev(p))

1048

1049

# build deltas

1049

# build deltas

1050

for d in xrange(0, len(revs) - 1):

1050

for d in xrange(0, len(revs) - 1):

1051

a, b = revs[d], revs[d + 1]

1051

a, b = revs[d], revs[d + 1]

1052

nb = self.node(b)

1052

nb = self.node(b)

1053

1054

if infocollect is not None:

1054

if infocollect is not None:

1055

infocollect(nb)

1055

infocollect(nb)

1056

1057

d = self.revdiff(a, b)

1057

d = self.revdiff(a, b)

1058

p = self.parents(nb)

1058

p = self.parents(nb)

1059

meta = nb + p[0] + p[1] + lookup(nb)

1059

meta = nb + p[0] + p[1] + lookup(nb)

1060

yield changegroup.genchunk("%s%s" % (meta, d))

1060

yield changegroup.genchunk("%s%s" % (meta, d))

1061

1062

yield changegroup.closechunk()

1062

yield changegroup.closechunk()

1063

1064

def addgroup(self, revs, linkmapper, transaction, unique=0):

1064

def addgroup(self, revs, linkmapper, transaction, unique=0):

1065

"""

1065

"""

1066

add a delta group

1066

add a delta group

1067

1068

given a set of deltas, add them to the revision log. the

1068

given a set of deltas, add them to the revision log. the

1069

first delta is against its parent, which should be in our

1069

first delta is against its parent, which should be in our

1070

log, the rest are against the previous delta.

1070

log, the rest are against the previous delta.

1071

"""

1071

"""

1072

1073

#track the base of the current delta log

1073

#track the base of the current delta log

1074

r = self.count()

1074

r = self.count()

1075

t = r - 1

1075

t = r - 1

1076

node = None

1076

node = None

1077

1078

base = prev = -1

1078

base = prev = -1

1079

start = end = textlen = 0

1079

start = end = textlen = 0

1080

if r:

1080

if r:

1081

end = self.end(t)

1081

end = self.end(t)

1082

1083

ifh = self.opener(self.indexfile, "a+")

1083

ifh = self.opener(self.indexfile, "a+")

1084

ifh.seek(0, 2)

1084

ifh.seek(0, 2)

1085

transaction.add(self.indexfile, ifh.tell(), self.count())

1085

transaction.add(self.indexfile, ifh.tell(), self.count())

1086

if self.inlinedata():

1086

if self.inlinedata():

1087

dfh = None

1087

dfh = None

1088

else:

1088

else:

1089

transaction.add(self.datafile, end)

1089

transaction.add(self.datafile, end)

1090

dfh = self.opener(self.datafile, "a")

1090

dfh = self.opener(self.datafile, "a")

1091

1092

# loop through our set of deltas

1092

# loop through our set of deltas

1093

chain = None

1093

chain = None

1094

for chunk in revs:

1094

for chunk in revs:

1095

node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])

1095

node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])

1096

link = linkmapper(cs)

1096

link = linkmapper(cs)

1097

if node in self.nodemap:

1097

if node in self.nodemap:

1098

# this can happen if two branches make the same change

1098

# this can happen if two branches make the same change

1099

# if unique:

1099

# if unique:

1100

# raise RevlogError(_("already have %s") % hex(node[:4]))

1100

# raise RevlogError(_("already have %s") % hex(node[:4]))

1101

chain = node

1101

chain = node

1102

continue

1102

continue

1103

delta = chunk[80:]

1103

delta = chunk[80:]

1104

1105

for p in (p1, p2):

1105

for p in (p1, p2):

1106

if not p in self.nodemap:

1106

if not p in self.nodemap:

1107

raise RevlogError(_("unknown parent %s") % short(p1))

1107

raise RevlogError(_("unknown parent %s") % short(p1))

1108

1109

if not chain:

1109

if not chain:

1110

# retrieve the parent revision of the delta chain

1110

# retrieve the parent revision of the delta chain

1111

chain = p1

1111

chain = p1

1112

if not chain in self.nodemap:

1112

if not chain in self.nodemap:

1113

raise RevlogError(_("unknown base %s") % short(chain[:4]))

1113

raise RevlogError(_("unknown base %s") % short(chain[:4]))

1114

1115

# full versions are inserted when the needed deltas become

1115

# full versions are inserted when the needed deltas become

1116

# comparable to the uncompressed text or when the previous

1116

# comparable to the uncompressed text or when the previous

1117

# version is not the one we have a delta against. We use

1117

# version is not the one we have a delta against. We use

1118

# the size of the previous full rev as a proxy for the

1118

# the size of the previous full rev as a proxy for the

1119

# current size.

1119

# current size.

1120

1121

if chain == prev:

1121

if chain == prev:

1122

tempd = compress(delta)

1122

tempd = compress(delta)

1123

cdelta = tempd[0] + tempd[1]

1123

cdelta = tempd[0] + tempd[1]

1124

textlen = mdiff.patchedsize(textlen, delta)

1124

textlen = mdiff.patchedsize(textlen, delta)

1125

1126

if chain != prev or (end - start + len(cdelta)) > textlen * 2:

1126

if chain != prev or (end - start + len(cdelta)) > textlen * 2:

1127

# flush our writes here so we can read it in revision

1127

# flush our writes here so we can read it in revision

1128

if dfh:

1128

if dfh:

1129

dfh.flush()

1129

dfh.flush()

1130

ifh.flush()

1130

ifh.flush()

1131

text = self.revision(chain)

1131

text = self.revision(chain)

1132

text = self.patches(text, [delta])

1132

text = self.patches(text, [delta])

1133

chk = self.addrevision(text, transaction, link, p1, p2)

1133

chk = self.addrevision(text, transaction, link, p1, p2)

1134

if chk != node:

1134

if chk != node:

1135

raise RevlogError(_("consistency error adding group"))

1135

raise RevlogError(_("consistency error adding group"))

1136

textlen = len(text)

1136

textlen = len(text)

1137

else:

1137

else:

1138

if self.version == 0:

1138

if self.version == 0:

1139

e = (end, len(cdelta), base, link, p1, p2, node)

1139

e = (end, len(cdelta), base, link, p1, p2, node)

1140

else:

1140

else:

1141

e = (self.offset_type(end, 0), len(cdelta), textlen, base,

1141

e = (self.offset_type(end, 0), len(cdelta), textlen, base,

1142

link, self.rev(p1), self.rev(p2), node)

1142

link, self.rev(p1), self.rev(p2), node)

1143

self.index.append(e)

1143

self.index.append(e)

1144

self.nodemap[node] = r

1144

self.nodemap[node] = r

1145

if self.inlinedata():

1145

if self.inlinedata():

1146

ifh.write(struct.pack(self.indexformat, *e))

1146

ifh.write(struct.pack(self.indexformat, *e))

1147

ifh.write(cdelta)

1147

ifh.write(cdelta)

1148

self.checkinlinesize(transaction, ifh)

1148

self.checkinlinesize(transaction, ifh)

1149

if not self.inlinedata():

1149

if not self.inlinedata():

1150

dfh = self.opener(self.datafile, "a")

1150

dfh = self.opener(self.datafile, "a")

1151

ifh = self.opener(self.indexfile, "a")

1151

ifh = self.opener(self.indexfile, "a")

1152

else:

1152

else:

1153

if not dfh:

1153

if not dfh:

1154

# addrevision switched from inline to conventional

1154

# addrevision switched from inline to conventional

1155

# reopen the index

1155

# reopen the index

1156

dfh = self.opener(self.datafile, "a")

1156

dfh = self.opener(self.datafile, "a")

1157

ifh = self.opener(self.indexfile, "a")

1157

ifh = self.opener(self.indexfile, "a")

1158

dfh.write(cdelta)

1158

dfh.write(cdelta)

1159

ifh.write(struct.pack(self.indexformat, *e))

1159

ifh.write(struct.pack(self.indexformat, *e))

1160

1161

t, r, chain, prev = r, r + 1, node, node

1161

t, r, chain, prev = r, r + 1, node, node

1162

base = self.base(t)

1162

base = self.base(t)

1163

start = self.start(base)

1163

start = self.start(base)

1164

end = self.end(t)

1164

end = self.end(t)

1165

1166

if node is None:

1166

if node is None:

1167

raise RevlogError(_("group to be added is empty"))

1167

raise RevlogError(_("group to be added is empty"))

1168

return node

1168

return node

1169

1170

def strip(self, rev, minlink):

1170

def strip(self, rev, minlink):

1171

if self.count() == 0 or rev >= self.count():

1171

if self.count() == 0 or rev >= self.count():

1172

return

1172

return

1173

1174

if isinstance(self.index, lazyindex):

1174

if isinstance(self.index, lazyindex):

1175

self.loadindexmap()

1175

self.loadindexmap()

1176

1177

# When stripping away a revision, we need to make sure it

1177

# When stripping away a revision, we need to make sure it

1178

# does not actually belong to an older changeset.

1178

# does not actually belong to an older changeset.

1179

# The minlink parameter defines the oldest revision

1179

# The minlink parameter defines the oldest revision

1180

# we're allowed to strip away.

1180

# we're allowed to strip away.

1181

while minlink > self.index[rev][-4]:

1181

while minlink > self.index[rev][-4]:

1182

rev += 1

1182

rev += 1

1183

if rev >= self.count():

1183

if rev >= self.count():

1184

return

1184

return

1185

1186

# first truncate the files on disk

1186

# first truncate the files on disk

1187

end = self.start(rev)

1187

end = self.start(rev)

1188

if not self.inlinedata():

1188

if not self.inlinedata():

1189

df = self.opener(self.datafile, "a")

1189

df = self.opener(self.datafile, "a")

1190

df.truncate(end)

1190

df.truncate(end)

1191

end = rev * struct.calcsize(self.indexformat)

1191

end = rev * struct.calcsize(self.indexformat)

1192

else:

1192

else:

1193

end += rev * struct.calcsize(self.indexformat)

1193

end += rev * struct.calcsize(self.indexformat)

1194

1195

indexf = self.opener(self.indexfile, "a")

1195

indexf = self.opener(self.indexfile, "a")

1196

indexf.truncate(end)

1196

indexf.truncate(end)

1197

1198

# then reset internal state in memory to forget those revisions

1198

# then reset internal state in memory to forget those revisions

1199

self.cache = None

1199

self.cache = None

1200

self.chunkcache = None

1200

self.chunkcache = None

1201

for x in xrange(rev, self.count()):

1201

for x in xrange(rev, self.count()):

1202

del self.nodemap[self.node(x)]

1202

del self.nodemap[self.node(x)]

1203

1204

del self.index[rev:]

1204

del self.index[rev:]

1205

1206

def checksize(self):

1206

def checksize(self):

1207

expected = 0

1207

expected = 0

1208

if self.count():

1208

if self.count():

1209

expected = self.end(self.count() - 1)

1209

expected = self.end(self.count() - 1)

1210

1211

try:

1211

try:

1212

f = self.opener(self.datafile)

1212

f = self.opener(self.datafile)

1213

f.seek(0, 2)

1213

f.seek(0, 2)

1214

actual = f.tell()

1214

actual = f.tell()

1215

dd = actual - expected

1215

dd = actual - expected

1216

except IOError, inst:

1216

except IOError, inst:

1217

if inst.errno != errno.ENOENT:

1217

if inst.errno != errno.ENOENT:

1218

raise

1218

raise

1219

dd = 0

1219

dd = 0

1220

1221

try:

1221

try:

1222

f = self.opener(self.indexfile)

1222

f = self.opener(self.indexfile)

1223

f.seek(0, 2)

1223

f.seek(0, 2)

1224

actual = f.tell()

1224

actual = f.tell()

1225

s = struct.calcsize(self.indexformat)

1225

s = struct.calcsize(self.indexformat)

1226

i = actual / s

1226

i = actual / s

1227

di = actual - (i * s)

1227

di = actual - (i * s)

1228

if self.inlinedata():

1228

if self.inlinedata():

1229

databytes = 0

1229

databytes = 0

1230

for r in xrange(self.count()):

1230

for r in xrange(self.count()):

1231

databytes += self.length(r)

1231

databytes += self.length(r)

1232

dd = 0

1232

dd = 0

1233

di = actual - self.count() * s - databytes

1233

di = actual - self.count() * s - databytes

1234

except IOError, inst:

1234

except IOError, inst:

1235

if inst.errno != errno.ENOENT:

1235

if inst.errno != errno.ENOENT:

1236

raise

1236

raise

1237

di = 0

1237

di = 0

1238

1239

return (dd, di)

1239

return (dd, di)

1240

1241

             # httprangereader.py - just what it says
             #
             # Copyright 2005 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms
             # of the GNU General Public License, incorporated herein by reference.
             import byterange, urllib2
             class httprangereader(object):
                 """File-like reader that fetches a byte range of a URL on each read().

                 Only seek() and read() are provided; seek() just records the
                 offset that the next request will start from.
                 """
                 def __init__(self, url):
                     self.url = url
                     self.pos = 0
                 def seek(self, pos):
                     """Set the byte offset at which the next read() starts."""
                     self.pos = pos
                 def read(self, bytes=None):
                     """Fetch data starting at the current position.

                     With a non-zero bytes, ask for exactly that many bytes;
                     otherwise ask for everything from the current position to
                     the end of the resource.  The position is not advanced.
                     """
                     opener = urllib2.build_opener(byterange.HTTPRangeHandler())
                     urllib2.install_opener(opener)
                     req = urllib2.Request(self.url)
                     end = ''
                     if bytes:
                         # the last-byte position of an HTTP range is
                         # inclusive, so N bytes from pos end at pos + N - 1
                         end = self.pos + bytes - 1
                     req.add_header('Range', 'bytes=%d-%s' % (self.pos, end))
                     f = urllib2.urlopen(req)
                     if bytes is None:
                         return f.read()
                     # never hand back more than was asked for, even if the
                     # response body is longer than the requested range
                     return f.read(bytes)

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """
             revlog.py - storage back-end for mercurial
             This provides efficient delta storage with O(1) retrieve and append
             and O(changes) merge between branches
             Copyright 2005 Matt Mackall <mpm@selenic.com>
             This software may be used and distributed according to the terms
             of the GNU General Public License, incorporated herein by reference.
             """
             from node import *
             from i18n import gettext as _
             from demandload import demandload
             demandload(globals(), "binascii changegroup errno heapq mdiff os")
             demandload(globals(), "sha struct zlib")
             # revlog version strings
             REVLOGV0 = 0
             REVLOGNG = 1
             # revlog flags
             REVLOGNGINLINEDATA = (1 << 16)
             def flagstr(flag):
                 """Return the numeric revlog flag bit for a flag name.

                 Only "inline" is known; any other name raises RevlogError.
                 """
                 if flag == "inline":
                     return REVLOGNGINLINEDATA
                 # interpolate after the gettext lookup so the catalogue is
                 # searched for the constant template, not the formatted text
                 raise RevlogError(_("unknown revlog flag %s") % flag)
             def hash(text, p1, p2):
                 """compute the node id for text with parents p1 and p2

                 The digest covers the two parent ids (smaller one first, so the
                 order in which the parents are passed does not matter) followed
                 by the text itself.  Identical content with different history
                 therefore gets a different id.
                 """
                 if p2 < p1:
                     first, second = p2, p1
                 else:
                     first, second = p1, p2
                 digest = sha.new(first)
                 digest.update(second)
                 digest.update(text)
                 return digest.digest()
             def compress(text):
                 """return a (prefix, data) pair holding text, compressed if useful

                 Text of 44 bytes or more is run through zlib and the result is
                 kept unless it came out longer than the input.  Text stored
                 as-is gets the prefix 'u', except when it is empty or starts
                 with a NUL byte, in which case the prefix is empty.
                 """
                 if not text:
                     return ("", text)
                 if len(text) >= 44:
                     packed = zlib.compress(text)
                     if len(packed) <= len(text):
                         return ("", packed)
                 # from here on the text is stored uncompressed
                 if text[0] == '\0':
                     return ("", text)
                 return ('u', text)
             def decompress(bin):
                 """undo compress(), dispatching on the first byte of bin

                 Empty input and input starting with NUL are returned unchanged,
                 'x' marks zlib data and 'u' marks literal data following the
                 marker.  Any other leading byte raises RevlogError.
                 """
                 if not bin:
                     return bin
                 marker = bin[0]
                 if marker == '\0':
                     result = bin
                 elif marker == 'x':
                     result = zlib.decompress(bin)
                 elif marker == 'u':
                     result = bin[1:]
                 else:
                     raise RevlogError(_("unknown compression type %r") % marker)
                 return result
             indexformatv0 = ">4l20s20s20s"
             v0shaoffset = 56
             # index ng:
             # 6 bytes offset
             # 2 bytes flags
             # 4 bytes compressed length
             # 4 bytes uncompressed length
             # 4 bytes: base rev
             # 4 bytes link rev
             # 4 bytes parent 1 rev
             # 4 bytes parent 2 rev
             # 32 bytes: nodeid
             indexformatng = ">Qiiiiii20s12x"
             ngshaoffset = 32
             versionformat = ">i"
             class lazyparser(object):
                 """
                 this class avoids the need to parse the entirety of large indices

                 Index records are read from dataf on demand and kept in
                 self.index as raw, still-packed strings (None for records that
                 have not been read yet).  self.map maps node ids to record
                 numbers and is filled in as records are seen.
                 """
                 def __init__(self, dataf, size, indexformat, shaoffset):
                     # dataf: open index file object; seek() and read() are used
                     # size: length of the index data in bytes
                     # indexformat: struct format string of one index record
                     # shaoffset: byte offset of the 20-byte node id in a record
                     self.dataf = dataf
                     self.format = indexformat
                     # size in bytes of one packed record
                     self.s = struct.calcsize(indexformat)
                     self.indexformat = indexformat
                     self.datasize = size
                     # number of whole records in the file
                     self.l = size/self.s
                     self.index = [None] * self.l
                     self.map = {nullid: -1}
                     # allmap: set once loadmap() has filled self.map completely
                     self.allmap = 0
                     # all: set once every record has been loaded into self.index
                     self.all = 0
                     # number of findnode() searches done so far
                     self.mapfind_count = 0
                     self.shaoffset = shaoffset
                 def loadmap(self):
                     """
                     during a commit, we need to make sure the rev being added is
                     not a duplicate.  This requires loading the entire index,
                     which is fairly slow.  loadmap can load up just the node map,
                     which takes much less time.
                     """
                     if self.allmap: return
                     # NOTE(review): start is assigned but never read
                     start = 0
                     end = self.datasize
                     self.allmap = 1
                     cur = 0
                     count = 0
                     # read the file sequentially, 256 records at a time
                     blocksize = self.s * 256
                     self.dataf.seek(0)
                     while cur < end:
                         data = self.dataf.read(blocksize)
                         off = 0
                         for x in xrange(256):
                             # only the node id field is sliced out; the rest of
                             # the record is not unpacked
                             n = data[off + self.shaoffset:off + self.shaoffset + 20]
                             self.map[n] = count
                             count += 1
                             # stop after the last whole record; this leaves only
                             # the inner loop, the outer one ends on cur >= end
                             if count >= self.l:
                                 break
                             off += self.s
                         cur += blocksize
                 def loadblock(self, blockstart, blocksize, data=None):
                     """store the records of one block in self.index and self.map

                     blockstart and blocksize are byte values.  When data is not
                     passed in, blocksize bytes are read from dataf at blockstart.
                     Slots of self.index that are already filled are left alone.
                     """
                     if self.all: return
                     if data is None:
                         self.dataf.seek(blockstart)
                         data = self.dataf.read(blocksize)
                     # number of whole records actually available in data
                     lend = len(data) / self.s
                     # record number of the first record in the block
                     i = blockstart / self.s
                     off = 0
                     for x in xrange(lend):
                         if self.index[i + x] == None:
                             # keep the raw packed record; lazyindex unpacks it
                             # when the entry is accessed
                             b = data[off : off + self.s]
                             self.index[i + x] = b
                             n = b[self.shaoffset:self.shaoffset + 20]
                             self.map[n] = i + x
                         off += self.s
                 def findnode(self, node):
                     """search backwards through the index file for a specific node

                     Returns node when it was found (its record number is then in
                     self.map) and None otherwise.
                     """
                     if self.allmap: return None
                     # hg log will cause many many searches for the manifest
                     # nodes.  After we get called a few times, just load the whole
                     # thing.
                     if self.mapfind_count > 8:
                         self.loadmap()
                         if node in self.map:
                             return node
                         return None
                     self.mapfind_count += 1
                     # walk back from the last record to the last slot that has
                     # not been loaded yet
                     last = self.l - 1
                     while self.index[last] != None:
                         if last == 0:
                             # every slot is filled: nothing is left to search
                             self.all = 1
                             self.allmap = 1
                             return None
                         last -= 1
                     end = (last + 1) * self.s
                     blocksize = self.s * 256
                     # scan the file towards its start, one block of up to 256
                     # records per pass
                     while end >= 0:
                         start = max(end - blocksize, 0)
                         self.dataf.seek(start)
                         data = self.dataf.read(end - start)
                         findend = end - start
                         while True:
                             # we're searching backwards, so we have to make sure
                             # we don't find a changeset where this node is a parent
                             off = data.rfind(node, 0, findend)
                             # the next rfind only looks before this hit
                             findend = off
                             if off >= 0:
                                 # round the hit down to the start of its record
                                 # and compare that record's own node id field
                                 i = off / self.s
                                 off = i * self.s
                                 n = data[off + self.shaoffset:off + self.shaoffset + 20]
                                 if n == node:
                                     self.map[n] = i + start / self.s
                                     return node
                             else:
                                 break
                         end -= blocksize
                     return None
                 def loadindex(self, i=None, end=None):
                     """load index records through loadblock()

                     With no arguments the whole index is loaded.  With i and
                     end, records i up to (not including) end are loaded as a
                     single block.  With only i, one block of 64 records that
                     contains record i is loaded.
                     """
                     if self.all: return
                     all = False
                     if i == None:
                         blockstart = 0
                         # largest multiple of the record size that fits in 512
                         # bytes (integer division)
                         blocksize = (512 / self.s) * self.s
                         end = self.datasize
                         all = True
                     else:
                         if end:
                             # i and end are record numbers; convert to bytes
                             blockstart = i * self.s
                             end = end * self.s
                             blocksize = end - blockstart
                         else:
                             # clearing bit 5 moves the start back by at most 32
                             # records, so record i lies inside the 64-record
                             # block that begins there
                             blockstart = (i & ~(32)) * self.s
                             blocksize = self.s * 64
                             end = blockstart + blocksize
                     while blockstart < end:
                         self.loadblock(blockstart, blocksize)
                         blockstart += blocksize
                     if all: self.all = True
             class lazyindex(object):
                 """list-like view of the index that loads entries on first use

                 All storage lives in the parser's index list; entries still held
                 as packed strings are unpacked when they are read.
                 """
                 def __init__(self, parser):
                     self.p = parser
                 def __len__(self):
                     return len(self.p.index)
                 def load(self, pos):
                     """have the parser load entry pos and return what it stored"""
                     if pos < 0:
                         # turn a negative position into an absolute one
                         pos = pos + len(self.p.index)
                     self.p.loadindex(pos)
                     return self.p.index[pos]
                 def __getitem__(self, pos):
                     entry = self.p.index[pos]
                     if not entry:
                         # slot not populated yet
                         entry = self.load(pos)
                     if not isinstance(entry, str):
                         return entry
                     return struct.unpack(self.p.indexformat, entry)
                 def __setitem__(self, pos, item):
                     self.p.index[pos] = item
                 def __delitem__(self, pos):
                     del self.p.index[pos]
                 def append(self, e):
                     self.p.index.append(e)
             class lazymap(object):
                 """dict-like view of the node map that searches the index on a miss

                 All storage lives in the parser's map dictionary.
                 """
                 def __init__(self, parser):
                     self.p = parser
                 def load(self, key):
                     """ask the parser to find key; KeyError if it cannot"""
                     if self.p.findnode(key) is None:
                         raise KeyError(key)
                 def __contains__(self, key):
                     if key not in self.p.map:
                         # not seen so far: load the complete map and look again
                         self.p.loadmap()
                     return key in self.p.map
                 def __iter__(self):
                     yield nullid
                     parser = self.p
                     for rev in xrange(parser.l):
                         entry = parser.index[rev]
                         if not entry:
                             parser.loadindex(rev)
                             entry = parser.index[rev]
                         if isinstance(entry, str):
                             entry = struct.unpack(parser.indexformat, entry)
                         # the node id is the last field of an index entry
                         yield entry[-1]
                 def __getitem__(self, key):
                     known = self.p.map
                     if key in known:
                         return known[key]
                     try:
                         self.load(key)
                         return self.p.map[key]
                     except KeyError:
                         raise KeyError("node " + hex(key))
                 def __setitem__(self, key, val):
                     self.p.map[key] = val
                 def __delitem__(self, key):
                     del self.p.map[key]
             class RevlogError(Exception):
                 """error raised by the revlog code, e.g. for an unknown flag,
                 compression type or index format"""
             class revlog(object):
                 """
                 the underlying revision storage object
                 A revlog consists of two parts, an index and the revision data.
                 The index is a file with a fixed record size containing
                 information on each revision, includings its nodeid (hash), the
                 nodeids of its parents, the position and offset of its data within
                 the data file, and the revision it's based on. Finally, each entry
                 contains a linkrev entry that can serve as a pointer to external
                 data.
                 The revision data itself is a linear collection of data chunks.
                 Each chunk represents a revision and is usually represented as a
                 delta against the previous chunk. To bound lookup time, runs of
                 deltas are limited to about 2 times the length of the original
                 version data. This makes retrieval of a version proportional to
                 its size, or O(1) relative to the number of revisions.
                 Both pieces of the revlog are written to in an append-only
                 fashion, which means we never need to rewrite a file to insert or
                 remove data, and can use some simple techniques to avoid the need
                 for locking while reading.
                 """
                 def __init__(self, opener, indexfile, datafile, defversion=0):
                     """
                     set up a revlog and read its index

                     opener is the callable used to open indexfile and datafile;
                     going through it instead of opening files directly leaves
                     room for COW semantics or the like.  defversion is the
                     version assumed when the index holds no version of its own.
                     """
                     self.opener = opener
                     self.indexfile, self.datafile = indexfile, datafile
                     self.defversion = defversion
                     # no stat snapshot and nothing cached until load() has run
                     self.indexstat = self.cache = self.chunkcache = None
                     self.load()
                 def load(self):
                     v = self.defversion
                     try:
                         f = self.opener(self.indexfile)
                         i = f.read(4)
                         f.seek(0)
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         i = ""
                     else:
                         try:
                             st = os.fstat(f.fileno())
                         except AttributeError, inst:
                             st = None
                         else:
                             oldst = self.indexstat
                             if (oldst and st.st_dev == oldst.st_dev
                                 and st.st_ino == oldst.st_ino
                                 and st.st_mtime == oldst.st_mtime
                                 and st.st_ctime == oldst.st_ctime):
                                 return
                             self.indexstat = st
-                            if len(i) > 0:
+                        if len(i) > 0:
-                                v = struct.unpack(versionformat, i)[0]
+                            v = struct.unpack(versionformat, i)[0]
                     flags = v & ~0xFFFF
                     fmt = v & 0xFFFF
                     if fmt == 0:
                         if flags:
                             raise RevlogError(_("index %s invalid flags %x for format v0" %
                                                (self.indexfile, flags)))
                     elif fmt == REVLOGNG:
                         if flags & ~REVLOGNGINLINEDATA:
                             raise RevlogError(_("index %s invalid flags %x for revlogng" %
                                                (self.indexfile, flags)))
                     else:
                         raise RevlogError(_("index %s invalid format %d" %
                                            (self.indexfile, fmt)))
                     self.version = v
                     if v == 0:
                         self.indexformat = indexformatv0
                         shaoffset = v0shaoffset
                     else:
                         self.indexformat = indexformatng
                         shaoffset = ngshaoffset
                     if i:
                         if not self.inlinedata() and st and st.st_size > 10000:
                             # big index, let's parse it on demand
                             parser = lazyparser(f, st.st_size, self.indexformat, shaoffset)
                             self.index = lazyindex(parser)
                             self.nodemap = lazymap(parser)
                         else:
                             i = f.read()
                             self.parseindex(i)
                         if self.inlinedata():
                             # we've already got the entire data file read in, save it
                             # in the chunk data
                             self.chunkcache = (0, i)
                         if self.version != 0:
                             e = list(self.index[0])
                             type = self.ngtype(e[0])
                             e[0] = self.offset_type(0, type)
                             self.index[0] = e
                     else:
                         self.nodemap = { nullid: -1}
                         self.index = []
                 def parseindex(self, data):
                     """unpack every index record in data into index and nodemap

                     For an inline revlog each record is followed by its revision
                     data, which is skipped using the length stored in field 1.
                     """
                     recsize = struct.calcsize(self.indexformat)
                     total = len(data)
                     self.index = []
                     self.nodemap =  {nullid: -1}
                     inline = self.inlinedata()
                     pos = 0
                     while pos < total:
                         entry = struct.unpack(self.indexformat,
                                               data[pos:pos + recsize])
                         # the rev number is the entry's position in the index
                         self.nodemap[entry[-1]] = len(self.index)
                         self.index.append(entry)
                         pos += recsize
                         if inline:
                             pos += entry[1]
                 def ngoffset(self, q):
                     """Extract the data offset from a packed offset/type field.

                     The low 16 bits of q hold the type bits and the remaining high
                     bits hold the offset (see offset_type).

                     Returns the offset as a long.
                     Raises RevlogError if any of the low 16 bits is set.
                     """
                     flags = q & 0xFFFF
                     if flags:
                         # format the offending bits themselves; the builtin `type`
                         # is not a valid argument for %x
                         raise RevlogError(_('%s: incompatible revision flag %x') %
                                           (self.indexfile, flags))
                     return long(q >> 16)
                 def ngtype(self, q):
                     """Return the low 16 bits of the packed field q as an int."""
                     lowbits = q & 0xFFFF
                     return int(lowbits)
                 def offset_type(self, offset, type):
                     """Pack offset and type into one long.

                     The offset is shifted left by 16 bits and type is or'ed into
                     the result.
                     """
                     shifted = long(offset) << 16
                     return long(shifted | type)
                 def loadindex(self, start, end):
                     """load a block of indexes all at once from the lazy parser

                     Does nothing when self.index is not a lazyindex.
                     """
                     if not isinstance(self.index, lazyindex):
                         return
                     self.index.p.loadindex(start, end)
                 def loadindexmap(self):
                     """loads both the map and the index from the lazy parser

                     Does nothing when self.index is not a lazyindex; otherwise the
                     parser's map replaces self.nodemap.
                     """
                     if not isinstance(self.index, lazyindex):
                         return
                     parser = self.index.p
                     parser.loadindex()
                     self.nodemap = parser.map
                 def loadmap(self):
                     """loads the map from the lazy parser

                     Does nothing when self.nodemap is not a lazymap; otherwise the
                     parser's fully loaded map replaces self.nodemap.
                     """
                     if not isinstance(self.nodemap, lazymap):
                         return
                     self.nodemap.p.loadmap()
                     loaded = self.nodemap.p.map
                     self.nodemap = loaded
                 def inlinedata(self):
                     """Return the REVLOGNGINLINEDATA bit of self.version (0 if unset)."""
                     inlinebit = self.version & REVLOGNGINLINEDATA
                     return inlinebit
                 def tip(self):
                     """Return the node of the last revision in the index."""
                     lastrev = len(self.index) - 1
                     return self.node(lastrev)
                 def count(self):
                     """Return the number of entries in the index."""
                     entries = self.index
                     return len(entries)
                 def node(self, rev):
                     """Return the node id stored for revision number rev.

                     Any negative rev maps to nullid; otherwise the node is the last
                     field of the index entry.
                     """
                     # explicit branch instead of the `cond and a or b` idiom, which
                     # would silently fall through to the index if nullid were falsy
                     if rev < 0:
                         return nullid
                     return self.index[rev][-1]
                 def rev(self, node):
                     """Return the revision number recorded for node in self.nodemap.

                     Raises RevlogError when the node is not in the map.
                     """
                     try:
                         found = self.nodemap[node]
                     except KeyError:
                         raise RevlogError(_('%s: no node %s') % (self.indexfile, hex(node)))
                     return found
                 def linkrev(self, node):
                     """Return the link revision (fourth field from the end) of node's entry."""
                     entry = self.index[self.rev(node)]
                     return entry[-4]
                 def parents(self, node):
                     """Return the two parents of node as node ids.

                     nullid has (nullid, nullid) as parents.  For version 0 the stored
                     pair is returned as is; otherwise the stored values are passed
                     through self.node() and returned as a list.
                     """
                     if node == nullid:
                         return (nullid, nullid)
                     entry = self.index[self.rev(node)]
                     pair = entry[-3:-1]
                     if self.version != 0:
                         # newer index entries store parent revision numbers
                         return [self.node(prev) for prev in pair]
                     return pair
                 def start(self, rev):
                     """Return the data offset of rev, or -1 for a negative rev.

                     For version 0 the first index field is the offset itself;
                     otherwise it is decoded with ngoffset().
                     """
                     if rev < 0:
                         return -1
                     rawoffset = self.index[rev][0]
                     if self.version == 0:
                         return rawoffset
                     return self.ngoffset(rawoffset)
                 def end(self, rev):
                     """Return the offset just past rev's data: start(rev) + length(rev)."""
                     first = self.start(rev)
                     return first + self.length(rev)
                 def size(self, rev):
                     """return the length of the uncompressed text for a given revision

                     For non-zero versions the length stored in the index (field 2) is
                     used when it is not negative; otherwise the revision text is
                     rebuilt and measured.
                     """
                     if self.version != 0:
                         stored = self.index[rev][2]
                         if stored >= 0:
                             return stored
                     return len(self.revision(self.node(rev)))
                     # alternate implementation, The advantage to this code is it
                     # will be faster for a single revision.  But, the results are not
                     # cached, so finding the size of every revision will be slower.
                     #
                     # if self.cache and self.cache[1] == rev:
                     #     return len(self.cache[2])
                     # base = self.base(rev)
                     # if self.cache and self.cache[1] >= base and self.cache[1] < rev:
                     #     base = self.cache[1]
                     #     text = self.cache[2]
                     # else:
                     #     text = self.revision(self.node(base))
                     # l = len(text)
                     # for x in xrange(base + 1, rev + 1):
                     #     l = mdiff.patchedsize(l, self.chunk(x))
                     # return l
                 def length(self, rev):
                     """Return the stored length (index field 1) of rev; 0 for a negative rev."""
                     if rev >= 0:
                         return self.index[rev][1]
                     return 0
                 def base(self, rev):
                     """Return the base revision recorded for rev (fifth field from the end).

                     A negative rev is returned unchanged.
                     """
                     if rev < 0:
                         return rev
                     return self.index[rev][-5]
                 def reachable(self, rev, stop=None):
                     """Return a dict whose keys are the nodes reachable from rev.

                     Despite its name, rev is a node id.  Parents are followed breadth
                     first; the walk does not continue past stop or nullid, and parents
                     whose revision number is lower than that of stop are ignored.
                     """
                     seen = {rev: 1}
                     pending = [rev]
                     if stop:
                         stopn = self.rev(stop)
                     else:
                         stopn = 0
                     while pending:
                         cur = pending.pop(0)
                         if cur == stop or cur == nullid:
                             continue
                         for parent in self.parents(cur):
                             if self.rev(parent) < stopn:
                                 continue
                             if parent not in seen:
                                 seen[parent] = 1
                                 pending.append(parent)
                     return seen
                 def nodesbetween(self, roots=None, heads=None):
                     """Return a tuple containing three elements. Elements 1 and 2 contain
                     a final list of bases and heads after all the unreachable ones have
                     been pruned.  Element 0 contains a topologically sorted list of all
                     nodes that satisfy these constraints:

                     1. All nodes must be descended from a node in roots (the nodes in
                        roots are considered descended from themselves).
                     2. All nodes must also be ancestors of a node in heads (the nodes in
                        heads are considered to be their own ancestors).

                     If roots is unspecified, nullid is assumed as the only root.
                     If heads is unspecified, it is taken to be the output of the
                     heads method (i.e. a list of all nodes in the repository that
                     have no children).

                     An empty roots or heads list, or a combination that selects no
                     nodes, yields ([], [], [])."""
                     nonodes = ([], [], [])
                     if roots is not None:
                         roots = list(roots)
                         if not roots:
                             return nonodes
                         lowestrev = min([self.rev(n) for n in roots])
                     else:
                         roots = [nullid] # Everybody's a descendent of nullid
                         lowestrev = -1
                     if (lowestrev == -1) and (heads is None):
                         # We want _all_ the nodes!
                         return ([self.node(r) for r in xrange(0, self.count())],
                                 [nullid], list(self.heads()))
                     if heads is None:
                         # All nodes are ancestors, so the latest ancestor is the last
                         # node.
                         highestrev = self.count() - 1
                         # Set ancestors to None to signal that every node is an ancestor.
                         ancestors = None
                         # Set heads to an empty dictionary for later discovery of heads
                         heads = {}
                     else:
                         heads = list(heads)
                         if not heads:
                             return nonodes
                         ancestors = {}
                         # Start at the top and keep marking parents until we're done.
                         nodestotag = heads[:]
                         # Turn heads into a dictionary so we can remove 'fake' heads.
                         # Also, later we will be using it to filter out the heads we can't
                         # find from roots.
                         heads = dict.fromkeys(heads, 0)
                         # Remember where the top was so we can use it as a limit later.
                         highestrev = max([self.rev(n) for n in nodestotag])
                         while nodestotag:
                             # grab a node to tag
                             n = nodestotag.pop()
                             # Never tag nullid
                             if n == nullid:
                                 continue
                             # A node's revision number represents its place in a
                             # topologically sorted list of nodes.
                             r = self.rev(n)
                             if r >= lowestrev:
                                 if n not in ancestors:
                                     # If we are possibly a descendent of one of the roots
                                     # and we haven't already been marked as an ancestor
                                     ancestors[n] = 1 # Mark as ancestor
                                     # Add non-nullid parents to list of nodes to tag.
                                     nodestotag.extend([p for p in self.parents(n) if
                                                        p != nullid])
                                 elif n in heads: # We've seen it before, is it a fake head?
                                     # So it is, real heads should not be the ancestors of
                                     # any other heads.
                                     heads.pop(n)
                         if not ancestors:
                             return nonodes
                         # Now that we have our set of ancestors, we want to remove any
                         # roots that are not ancestors.
                         # If one of the roots was nullid, everything is included anyway.
                         if lowestrev > -1:
                             # But, since we weren't, let's recompute the lowest rev to not
                             # include roots that aren't ancestors.
                             # Filter out roots that aren't ancestors of heads
                             roots = [n for n in roots if n in ancestors]
                             # Recompute the lowest revision
                             if roots:
                                 lowestrev = min([self.rev(n) for n in roots])
                             else:
                                 # No more roots?  Return empty list
                                 return nonodes
                         else:
                             # We are descending from nullid, and don't need to care about
                             # any other roots.
                             lowestrev = -1
                             roots = [nullid]
                     # Transform our roots list into a 'set' (i.e. a dictionary where the
                     # values don't matter).
                     descendents = dict.fromkeys(roots, 1)
                     # Also, keep the original roots so we can filter out roots that aren't
                     # 'real' roots (i.e. are descended from other roots).
                     roots = descendents.copy()
                     # Our topologically sorted list of output nodes.
                     orderedout = []
                     # Don't start at nullid since we don't want nullid in our output list,
                     # and if nullid shows up in descendents, empty parents will look like
                     # they're descendents.
                     for r in xrange(max(lowestrev, 0), highestrev + 1):
                         n = self.node(r)
                         isdescendent = False
                         if lowestrev == -1:  # Everybody is a descendent of nullid
                             isdescendent = True
                         elif n in descendents:
                             # n is already a descendent
                             isdescendent = True
                             # This check only needs to be done here because all the roots
                             # will start being marked as descendents before the loop.
                             if n in roots:
                                 # If n was a root, check if it's a 'real' root.
                                 p = tuple(self.parents(n))
                                 # If any of its parents are descendents, it's not a root.
                                 if (p[0] in descendents) or (p[1] in descendents):
                                     roots.pop(n)
                         else:
                             p = tuple(self.parents(n))
                             # A node is a descendent if either of its parents are
                             # descendents.  (We seeded the descendents dict with the
                             # roots up there, remember?)
                             if (p[0] in descendents) or (p[1] in descendents):
                                 descendents[n] = 1
                                 isdescendent = True
                         if isdescendent and ((ancestors is None) or (n in ancestors)):
                             # Only include nodes that are both descendents and ancestors.
                             orderedout.append(n)
                             if (ancestors is not None) and (n in heads):
                                 # We're trying to figure out which heads are reachable
                                 # from roots.
                                 # Mark this head as having been reached
                                 heads[n] = 1
                             elif ancestors is None:
                                 # Otherwise, we're trying to discover the heads.
                                 # Assume this is a head because if it isn't, the next step
                                 # will eventually remove it.
                                 heads[n] = 1
                                 # But, obviously its parents aren't.
                                 for p in self.parents(n):
                                     heads.pop(p, None)
                     # Keep only the heads that were actually reached (value set to 1).
                     heads = [n for n in heads.iterkeys() if heads[n] != 0]
                     roots = roots.keys()
                     # Sanity checks: every path that reaches this point is expected to
                     # have found at least one node, one root and one head.
                     assert orderedout
                     assert roots
                     assert heads
                     return (orderedout, roots, heads)
                 def heads(self, start=None):
                     """return the list of all nodes that have no children

                     if start is specified, only heads that are descendants of
                     start will be returned; start defaults to nullid
                     """
                     if start is None:
                         start = nullid
                     descendants = {start: 1}
                     childless = {start: 1}
                     firstrev = self.rev(start) + 1
                     for r in xrange(firstrev, self.count()):
                         cur = self.node(r)
                         for parent in self.parents(cur):
                             if parent in descendants:
                                 # cur descends from start; treat it as a head until
                                 # one of its own children shows up
                                 descendants[cur] = 1
                                 childless[cur] = 1
                             if parent in childless:
                                 del childless[parent]
                     return childless.keys()
                 def children(self, node):
                     """find the children of a given node

                     Scans every revision after node and returns the nodes that list
                     node as a parent, once per matching parent slot.
                     """
                     found = []
                     firstrev = self.rev(node) + 1
                     for r in range(firstrev, self.count()):
                         candidate = self.node(r)
                         for parent in self.parents(candidate):
                             if parent == node:
                                 found.append(candidate)
                     return found
                 def lookup(self, id):
                     """locate a node based on revision number or subset of hex nodeid

                     A string that is exactly a decimal revision number (negative
                     values count back from the end) selects that revision.  Anything
                     else is matched as a prefix of the hex form of every known node;
                     RevlogError is raised unless exactly one node matches.
                     """
                     try:
                         rev = int(id)
                         if str(rev) != id:
                             raise ValueError
                         if rev < 0:
                             rev = self.count() + rev
                         if rev < 0 or rev >= self.count():
                             raise ValueError
                         return self.node(rev)
                     except (ValueError, OverflowError):
                         matches = [n for n in self.nodemap if hex(n).startswith(id)]
                         if len(matches) > 1:
                             raise RevlogError(_("Ambiguous identifier"))
                         if len(matches) < 1:
                             raise RevlogError(_("No match found"))
                         return matches[0]
                 def diff(self, a, b):
                     """return a delta between two revisions

                     Thin wrapper around mdiff.textdiff(a, b).
                     """
                     delta = mdiff.textdiff(a, b)
                     return delta
                 def patches(self, t, pl):
                     """apply a list of patches to a string

                     Thin wrapper around mdiff.patches(t, pl).
                     """
                     patched = mdiff.patches(t, pl)
                     return patched
                 def chunk(self, rev, df=None, cachelen=4096):
                     """Return the decompressed data chunk stored for revision rev.

                     rev - the revision number whose chunk is wanted
                     df - an optional open file object to read from; when omitted and
                          a read is needed, the index file (inline revlogs) or the data
                          file is opened
                     cachelen - minimum number of bytes read into self.chunkcache when
                                the cache has to be (re)filled

                     self.chunkcache is a (start offset, data) pair and is replaced
                     whenever the requested range is not fully covered by it.
                     """
                     start, length = self.start(rev), self.length(rev)
                     inline = self.inlinedata()
                     if inline:
                         # inline data is interleaved with the index: one index entry
                         # precedes the data of each revision up to and including rev
                         start += (rev + 1) * struct.calcsize(self.indexformat)
                     end = start + length
                     def loadcache(df):
                         # read at least the whole chunk, and at least cachelen bytes
                         cache_length = max(cachelen, length) # 4k
                         if not df:
                             if inline:
                                 df = self.opener(self.indexfile)
                             else:
                                 df = self.opener(self.datafile)
                         df.seek(start)
                         self.chunkcache = (start, df.read(cache_length))
                     if not self.chunkcache:
                         loadcache(df)
                     cache_start = self.chunkcache[0]
                     cache_end = cache_start + len(self.chunkcache[1])
                     if start >= cache_start and end <= cache_end:
                         # it is cached
                         offset = start - cache_start
                     else:
                         # cache miss: the refilled cache begins exactly at start
                         loadcache(df)
                         offset = 0
                     #def checkchunk():
                     #    df = self.opener(self.datafile)
                     #    df.seek(start)
                     #    return df.read(length)
                     #assert s == checkchunk()
                     return decompress(self.chunkcache[1][offset:offset + length])
                 def delta(self, node):
                     """return or calculate a delta between a node and its predecessor

                     The predecessor is the revision numbered one below node's.
                     """
                     cur = self.rev(node)
                     prev = cur - 1
                     return self.revdiff(prev, cur)
                 def revdiff(self, rev1, rev2):
                     """return or calculate a delta between two revisions

                     When rev2 directly follows rev1 and both share the same base, the
                     stored chunk of rev2 is returned; otherwise both texts are rebuilt
                     and diffed.
                     """
                     samebase = self.base(rev1) == self.base(rev2)
                     if samebase and rev1 + 1 == rev2:
                         return self.chunk(rev2)
                     oldtext = self.revision(self.node(rev1))
                     newtext = self.revision(self.node(rev2))
                     return self.diff(oldtext, newtext)
                 def revision(self, node):
                     """Return the full uncompressed text of the revision named by node.

                     nullid yields the empty string and a hit on self.cache is returned
                     directly.  Otherwise the text is rebuilt from a starting text (the
                     base chunk, or the cached text when it lies on the same chain) plus
                     the chunks up to the wanted revision, checked against the node hash
                     and stored in self.cache.

                     Raises RevlogError when the rebuilt text does not hash to node.
                     """
                     if node == nullid:
                         return ""
                     if self.cache and self.cache[0] == node:
                         return self.cache[2]
                     # look up what we need to read
                     rev = self.rev(node)
                     base = self.base(rev)
                     # for inline revlogs no data file is opened here
                     df = None
                     if not self.inlinedata():
                         df = self.opener(self.datafile)
                     # do we have useful data cached?
                     cached = self.cache
                     if cached and cached[1] >= base and cached[1] < rev:
                         base = cached[1]
                         text = cached[2]
                         self.loadindex(base, rev + 1)
                     else:
                         self.loadindex(base, rev + 1)
                         text = self.chunk(base, df=df)
                     bins = [self.chunk(r, df=df) for r in xrange(base + 1, rev + 1)]
                     text = self.patches(text, bins)
                     p1, p2 = self.parents(node)
                     if node != hash(text, p1, p2):
                         raise RevlogError(_("integrity check failed on %s:%d")
                                           % (self.datafile, rev))
                     self.cache = (node, rev, text)
                     return text
                 def checkinlinesize(self, tr, fp=None):
                     """Move the data of an inline revlog to a separate data file once
                     the index file has grown to 131072 bytes or more.

                     tr - the transaction object; it must already know the index file
                     fp - an optional open index file handle whose current position
                          (fp.tell()) is taken as the file size; when omitted the
                          index file is opened and positioned at its end

                     Does nothing for non-inline revlogs or while the file is still
                     small.  Otherwise every revision's data is copied to the data
                     file, the index is rewritten without inline data, the inline flag
                     is cleared in self.version and the chunk cache is dropped.  fp is
                     closed in the process.

                     Raises RevlogError if the index file is not part of tr.
                     """
                     if not self.inlinedata():
                         return
                     if not fp:
                         fp = self.opener(self.indexfile, 'r')
                         fp.seek(0, 2)
                     size = fp.tell()
                     if size < 131072:
                         return
                     trinfo = tr.find(self.indexfile)
                     if trinfo is None:
                         # format after the translation lookup so the untranslated
                         # template, not the filled-in message, is the lookup key
                         raise RevlogError(_("%s not found in the transaction") %
                                           self.indexfile)
                     trindex = trinfo[2]
                     dataoff = self.start(trindex)
                     tr.add(self.datafile, dataoff)
                     df = self.opener(self.datafile, 'w')
                     calc = struct.calcsize(self.indexformat)
                     for r in xrange(self.count()):
                         # inline data of revision r sits after r + 1 index entries
                         start = self.start(r) + (r + 1) * calc
                         length = self.length(r)
                         fp.seek(start)
                         d = fp.read(length)
                         df.write(d)
                     fp.close()
                     df.close()
                     fp = self.opener(self.indexfile, 'w', atomictemp=True)
                     self.version &= ~(REVLOGNGINLINEDATA)
                     if self.count():
                         # the first 4 bytes of the first entry are replaced by the
                         # packed version header
                         x = self.index[0]
                         e = struct.pack(self.indexformat, *x)[4:]
                         l = struct.pack(versionformat, self.version)
                         fp.write(l)
                         fp.write(e)
                     for i in xrange(1, self.count()):
                         x = self.index[i]
                         e = struct.pack(self.indexformat, *x)
                         fp.write(e)
                     # if we don't call rename, the temp file will never replace the
                     # real index
                     fp.rename()
                     tr.replace(self.indexfile, trindex * calc)
                     self.chunkcache = None
                 def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
                     """add a revision to the log

                     text - the revision data to add
                     transaction - the transaction object used for rollback
                     link - the linkrev data to add
                     p1, p2 - the parent nodeids of the revision
                     d - an optional precomputed delta

                     p1 defaults to the current tip and p2 to nullid.  Returns the
                     node id of the revision; if that node is already present nothing
                     is written.
                     """
                     if text is None: text = ""
                     if p1 is None: p1 = self.tip()
                     if p2 is None: p2 = nullid
                     node = hash(text, p1, p2)
                     if node in self.nodemap:
                         return node
                     # n is the number of the new revision, t the current tip revision
                     n = self.count()
                     t = n - 1
                     if n:
                         base = self.base(t)
                         start = self.start(base)
                         end = self.end(t)
                         if not d:
                             prev = self.revision(self.tip())
                             d = self.diff(prev, str(text))
                         data = compress(d)
                         l = len(data[1]) + len(data[0])
                         # bytes spanned by the delta chain including the new delta
                         dist = end - start + l
                     # full versions are inserted when the needed deltas
                     # become comparable to the uncompressed text
                     # (dist is only defined when n is non-zero; `not n` is tested first)
                     if not n or dist > len(text) * 2:
                         data = compress(text)
                         l = len(data[1]) + len(data[0])
                         base = n
                     else:
                         base = self.base(t)
                     offset = 0
                     if t >= 0:
                         offset = self.end(t)
                     if self.version == 0:
                         e = (offset, l, base, link, p1, p2, node)
                     else:
                         # newer entries also record the text length and store the
                         # parents as revision numbers
                         e = (self.offset_type(offset, 0), l, len(text),
                              base, link, self.rev(p1), self.rev(p2), node)
                     self.index.append(e)
                     self.nodemap[node] = n
                     entry = struct.pack(self.indexformat, *e)
                     if not self.inlinedata():
                         # separate data file: register both files with the
                         # transaction, then append the data
                         transaction.add(self.datafile, offset)
                         transaction.add(self.indexfile, n * len(entry))
                         f = self.opener(self.datafile, "a")
                         if data[0]:
                             f.write(data[0])
                         f.write(data[1])
                         f.close()
                         f = self.opener(self.indexfile, "a")
                     else:
                         f = self.opener(self.indexfile, "a+")
                         f.seek(0, 2)
                         transaction.add(self.indexfile, f.tell(), self.count() - 1)
                     if len(self.index) == 1 and self.version != 0:
                         # first entry: the packed version header takes the place of
                         # the entry's first 4 bytes
                         l = struct.pack(versionformat, self.version)
                         f.write(l)
                         entry = entry[4:]
                     f.write(entry)
                     if self.inlinedata():
                         # inline revlog: the data follows its index entry directly
                         f.write(data[0])
                         f.write(data[1])
                         self.checkinlinesize(transaction, f)
                     self.cache = (node, n, text)
                     return node
                 def ancestor(self, a, b):
                     """calculate the least common ancestor of nodes a and b

                     a and b are node ids; a node id is returned.
                     """
                     # start with some short cuts for the linear cases
                     if a == b:
                         return a
                     ra = self.rev(a)
                     rb = self.rev(b)
                     # first is the node with the lower revision number, last the other
                     if ra < rb:
                         last = b
                         first = a
                     else:
                         last = a
                         first = b
                     # reachable won't include stop in the list, so we have to use a parent
                     reachable = self.reachable(last, stop=self.parents(first)[0])
                     if first in reachable:
                         return first
                     # calculate the distance of every node from root
                     dist = {nullid: 0}
                     for i in xrange(self.count()):
                         n = self.node(i)
                         p1, p2 = self.parents(n)
                         dist[n] = max(dist[p1], dist[p2]) + 1
                     # traverse ancestors in order of decreasing distance from root
                     def ancestors(node):
                         # we store negative distances because heap returns smallest member
                         h = [(-dist[node], node)]
                         seen = {}
                         while h:
                             d, n = heapq.heappop(h)
                             if n not in seen:
                                 seen[n] = 1
                                 yield (-d, n)
                                 for p in self.parents(n):
                                     heapq.heappush(h, (-dist[p], p))
                     # group the ancestors of node by distance: yields (distance, nodes)
                     # pairs where nodes is a dict keyed by the nodes at that distance
                     def generations(node):
                         sg, s = None, {}
                         for g,n in ancestors(node):
                             if g != sg:
                                 if sg:
                                     yield sg, s
                                 sg, s = g, {n:1}
                             else:
                                 s[n] = 1
                         yield sg, s
                     x = generations(a)
                     y = generations(b)
                     gx = x.next()
                     gy = y.next()
                     # increment each ancestor list until it is closer to root than
                     # the other, or they match
                     while 1:
                         #print "ancestor gen %s %s" % (gx[0], gy[0])
                         if gx[0] == gy[0]:
                             # find the intersection
                             i = [ n for n in gx[1] if n in gy[1] ]
                             if i:
                                 return i[0]
                             else:
                                 #print "next"
                                 gy = y.next()
                                 gx = x.next()
                         elif gx[0] < gy[0]:
                             #print "next y"
                             gy = y.next()
                         else:
                             #print "next x"
                             gx = x.next()
                 def group(self, nodelist, lookup, infocollect=None):
                     """calculate a delta group

                     Generator.  For the nodes in nodelist, yield one changegroup chunk
                     per node holding its metadata (node, both parents and
                     lookup(node)) followed by a delta against the previous entry, then
                     a closing chunk.  The first delta is against the first parent of
                     nodelist[0], which the receiver is guaranteed to have as it has
                     all history before these changesets.

                     infocollect, when given, is called with each node before its
                     chunk is produced.
                     """
                     revs = [self.rev(n) for n in nodelist]
                     # if we don't have any revisions touched by these changesets, bail
                     if not revs:
                         yield changegroup.closechunk()
                         return
                     # add the parent of the first rev
                     firstparent = self.parents(self.node(revs[0]))[0]
                     revs.insert(0, self.rev(firstparent))
                     # build deltas
                     for i in xrange(0, len(revs) - 1):
                         prevrev, currev = revs[i], revs[i + 1]
                         curnode = self.node(currev)
                         if infocollect is not None:
                             infocollect(curnode)
                         delta = self.revdiff(prevrev, currev)
                         nodeparents = self.parents(curnode)
                         meta = curnode + nodeparents[0] + nodeparents[1] + lookup(curnode)
                         yield changegroup.genchunk("%s%s" % (meta, delta))
                     yield changegroup.closechunk()
                 def addgroup(self, revs, linkmapper, transaction, unique=0):
                     """
                     add a delta group

                     given a set of deltas, add them to the revision log. the
                     first delta is against its parent, which should be in our
                     log, the rest are against the previous delta.

                     revs is an iterable of chunks. Each chunk starts with an
                     80-byte header of four 20-byte fields (node, p1, p2 and a
                     value handed to linkmapper), followed by the delta itself.
                     linkmapper's result is stored as the link of the new index
                     entry. transaction is told the current size of the index
                     (and data) file before anything is appended. unique is
                     accepted but currently ignored: the check that used it is
                     commented out below.

                     returns the node of the last chunk read. raises RevlogError
                     when a parent or the delta base is unknown, when a rebuilt
                     full revision does not hash to the advertised node, or when
                     the group contains no chunks at all.
                     """
                     #track the base of the current delta log
                     r = self.count()    # rev number the next entry will get
                     t = r - 1           # rev number of the current tip
                     node = None
                     base = prev = -1
                     start = end = textlen = 0
                     if r:
                         end = self.end(t)
                     ifh = self.opener(self.indexfile, "a+")
                     ifh.seek(0, 2)
                     # register the pre-append file sizes with the transaction
                     transaction.add(self.indexfile, ifh.tell(), self.count())
                     if self.inlinedata():
                         # inline revlogs keep the data inside the index file
                         dfh = None
                     else:
                         transaction.add(self.datafile, end)
                         dfh = self.opener(self.datafile, "a")
                     # loop through our set of deltas
                     chain = None
                     for chunk in revs:
                         node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
                         link = linkmapper(cs)
                         if node in self.nodemap:
                             # this can happen if two branches make the same change
                             # if unique:
                             #    raise RevlogError(_("already have %s") % hex(node[:4]))
                             chain = node
                             continue
                         delta = chunk[80:]
                         for p in (p1, p2):
                             if p not in self.nodemap:
                                 # name the parent that is actually missing; this
                                 # used to report p1 even when p2 was the unknown one
                                 raise RevlogError(_("unknown parent %s") % short(p))
                         if not chain:
                             # retrieve the parent revision of the delta chain
                             chain = p1
                             if chain not in self.nodemap:
                                 # pass the whole node: short() does the abbreviation
                                 raise RevlogError(_("unknown base %s") % short(chain))
                         # full versions are inserted when the needed deltas become
                         # comparable to the uncompressed text or when the previous
                         # version is not the one we have a delta against. We use
                         # the size of the previous full rev as a proxy for the
                         # current size.
                         if chain == prev:
                             tempd = compress(delta)
                             cdelta = tempd[0] + tempd[1]
                             textlen = mdiff.patchedsize(textlen, delta)
                         # cdelta is only evaluated when chain == prev (short-circuit)
                         if chain != prev or (end - start + len(cdelta)) > textlen * 2:
                             # flush our writes here so we can read it in revision
                             if dfh:
                                 dfh.flush()
                             ifh.flush()
                             text = self.revision(chain)
                             text = self.patches(text, [delta])
                             chk = self.addrevision(text, transaction, link, p1, p2)
                             if chk != node:
                                 raise RevlogError(_("consistency error adding group"))
                             textlen = len(text)
                         else:
                             # append the compressed delta directly to the chain
                             if self.version == 0:
                                 e = (end, len(cdelta), base, link, p1, p2, node)
                             else:
                                 e = (self.offset_type(end, 0), len(cdelta), textlen, base,
                                      link, self.rev(p1), self.rev(p2), node)
                             self.index.append(e)
                             self.nodemap[node] = r
                             if self.inlinedata():
                                 ifh.write(struct.pack(self.indexformat, *e))
                                 ifh.write(cdelta)
                                 self.checkinlinesize(transaction, ifh)
                                 if not self.inlinedata():
                                     # checkinlinesize switched us to a separate
                                     # data file; reopen both handles
                                     dfh = self.opener(self.datafile, "a")
                                     ifh = self.opener(self.indexfile, "a")
                             else:
                                 if not dfh:
                                     # addrevision switched from inline to conventional
                                     # reopen the index
                                     dfh = self.opener(self.datafile, "a")
                                     ifh = self.opener(self.indexfile, "a")
                                 dfh.write(cdelta)
                                 ifh.write(struct.pack(self.indexformat, *e))
                         # the entry just added becomes the base of the next delta
                         t, r, chain, prev = r, r + 1, node, node
                         base = self.base(t)
                         start = self.start(base)
                         end = self.end(t)
                     if node is None:
                         raise RevlogError(_("group to be added is empty"))
                     return node
                 def strip(self, rev, minlink):
                     """truncate the revlog so that rev and all later revisions vanish

                     Starting at rev, entries whose link (index field -4) is lower
                     than minlink are skipped; the first entry that is not becomes
                     the actual cut point. Nothing happens when the revlog is empty,
                     when rev is past the end, or when no entry qualifies.

                     The files on disk are truncated first, then the caches, the
                     nodemap and the in-memory index are trimmed to match.
                     """
                     if self.count() == 0 or rev >= self.count():
                         return
                     if isinstance(self.index, lazyindex):
                         self.loadindexmap()
                     # Never strip a revision that belongs to a changeset older
                     # than minlink: advance until the link is new enough.
                     while self.index[rev][-4] < minlink:
                         rev += 1
                         if rev >= self.count():
                             return
                     # first truncate the files on disk
                     dataend = self.start(rev)
                     if self.inlinedata():
                         # index entries and data share one file
                         indexend = dataend + rev * struct.calcsize(self.indexformat)
                     else:
                         datafh = self.opener(self.datafile, "a")
                         datafh.truncate(dataend)
                         indexend = rev * struct.calcsize(self.indexformat)
                     indexfh = self.opener(self.indexfile, "a")
                     indexfh.truncate(indexend)
                     # then make the in-memory state forget the stripped revisions
                     self.cache = None
                     self.chunkcache = None
                     for stale in xrange(rev, self.count()):
                         del self.nodemap[self.node(stale)]
                     del self.index[rev:]
                 def checksize(self):
                     expected = 0
                     if self.count():
                         expected = self.end(self.count() - 1)
                     try:
                         f = self.opener(self.datafile)
                         f.seek(0, 2)
                         actual = f.tell()
                         dd = actual - expected
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         dd = 0
                     try:
                         f = self.opener(self.indexfile)
                         f.seek(0, 2)
                         actual = f.tell()
                         s = struct.calcsize(self.indexformat)
                         i = actual / s
                         di = actual - (i * s)
                         if self.inlinedata():
                             databytes = 0
                             for r in xrange(self.count()):
                                 databytes += self.length(r)
                             dd = 0
                             di = actual - self.count() * s - databytes
                     except IOError, inst:
                         if inst.errno != errno.ENOENT:
                             raise
                         di = 0
                     return (dd, di)