Fixed spacing in assignment of REVLOG_DEFAULT_VERSION
Thomas Arendsen Hein
r4277:0ce23256 default
@@ -1,1299 +1,1299 @@
1 """
1 """
2 revlog.py - storage back-end for mercurial
2 revlog.py - storage back-end for mercurial
3
3
4 This provides efficient delta storage with O(1) retrieve and append
4 This provides efficient delta storage with O(1) retrieve and append
5 and O(changes) merge between branches
5 and O(changes) merge between branches
6
6
7 Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
7 Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
8
8
9 This software may be used and distributed according to the terms
9 This software may be used and distributed according to the terms
10 of the GNU General Public License, incorporated herein by reference.
10 of the GNU General Public License, incorporated herein by reference.
11 """
11 """
12
12
13 from node import *
13 from node import *
14 from i18n import _
14 from i18n import _
15 import binascii, changegroup, errno, ancestor, mdiff, os
15 import binascii, changegroup, errno, ancestor, mdiff, os
16 import sha, struct, util, zlib
16 import sha, struct, util, zlib
17
17
18 # revlog version strings
18 # revlog version strings
19 REVLOGV0 = 0
19 REVLOGV0 = 0
20 REVLOGNG = 1
20 REVLOGNG = 1
21
21
22 # revlog flags
22 # revlog flags
23 REVLOGNGINLINEDATA = (1 << 16)
23 REVLOGNGINLINEDATA = (1 << 16)
24 REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
24 REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
25
25
26 REVLOG_DEFAULT_FORMAT = REVLOGNG
26 REVLOG_DEFAULT_FORMAT = REVLOGNG
27 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
27 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
28
28
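# Editor's sketch, not part of revlog.py: the version word carries the
# on-disk format in its low 16 bits and feature flags in the high 16 bits,
# so the default version is simply the bitwise OR of the two parts.
assert REVLOG_DEFAULT_VERSION == 0x10001
assert REVLOG_DEFAULT_VERSION & 0xFFFF == REVLOGNG             # format part
assert REVLOG_DEFAULT_VERSION & ~0xFFFF == REVLOGNGINLINEDATA  # flag part
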
def flagstr(flag):
    if flag == "inline":
        return REVLOGNGINLINEDATA
    raise RevlogError(_("unknown revlog flag %s") % flag)

def hash(text, p1, p2):
    """generate a hash from the given text and its parent hashes

    This hash combines both the current file contents and its history
    in a manner that makes it easy to distinguish nodes with the same
    content in the revision graph.
    """
    l = [p1, p2]
    l.sort()
    s = sha.new(l[0])
    s.update(l[1])
    s.update(text)
    return s.digest()

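# Editor's sketch, not part of revlog.py: sorting the parents before
# hashing makes a nodeid independent of parent order.  The same digest
# written as a one-liner, using hashlib as a stand-in for the sha module
# imported above:
import hashlib

def _nodeid_sketch(text, p1, p2):
    a, b = sorted([p1, p2])
    return hashlib.sha1(a + b + text).digest()

assert _nodeid_sketch("text", "\1" * 20, "\2" * 20) == \
       _nodeid_sketch("text", "\2" * 20, "\1" * 20)
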
def compress(text):
    """ generate a possibly-compressed representation of text """
    if not text: return ("", text)
    if len(text) < 44:
        if text[0] == '\0': return ("", text)
        return ('u', text)
    bin = zlib.compress(text)
    if len(bin) > len(text):
        if text[0] == '\0': return ("", text)
        return ('u', text)
    return ("", bin)

def decompress(bin):
    """ decompress the given input """
    if not bin: return bin
    t = bin[0]
    if t == '\0': return bin
    if t == 'x': return zlib.decompress(bin)
    if t == 'u': return bin[1:]
    raise RevlogError(_("unknown compression type %r") % t)

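# Editor's sketch, not part of revlog.py: compress() tags its result so
# decompress() can tell the cases apart -- zlib output starts with 'x',
# uncompressible text gets a 'u' prefix, and text whose first byte is '\0'
# is stored bare.  Concatenating the returned pair round-trips:
_blob = "some revision text " * 10
_head, _body = compress(_blob)
assert decompress(_head + _body) == _blob
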
indexformatv0 = ">4l20s20s20s"
v0shaoffset = 56
# index ng:
# 6 bytes offset
# 2 bytes flags
# 4 bytes compressed length
# 4 bytes uncompressed length
# 4 bytes: base rev
# 4 bytes link rev
# 4 bytes parent 1 rev
# 4 bytes parent 2 rev
# 32 bytes: nodeid
indexformatng = ">Qiiiiii20s12x"
ngshaoffset = 32
versionformat = ">I"

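# Editor's sketch, not part of revlog.py: both index formats use fixed-size
# records, so revision N starts at byte N * entrysize and the nodeid sits
# at a constant offset inside every record.
assert struct.calcsize(indexformatv0) == 76        # 4 ints + 3 sha1 hashes
assert struct.calcsize(indexformatng) == 64        # padded to 64 bytes
assert ngshaoffset == struct.calcsize(">Qiiiiii")  # nodeid after the ints
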
class lazyparser(object):
    """
    this class avoids the need to parse the entirety of large indices
    """

    # lazyparser is not safe to use on windows if win32 extensions not
    # available. it keeps a file handle open, which makes it impossible
    # to break hardlinks on local cloned repos.
    safe_to_use = os.name != 'nt' or (not util.is_win_9x() and
                                      hasattr(util, 'win32api'))

    def __init__(self, dataf, size, indexformat, shaoffset):
        self.dataf = dataf
        self.format = indexformat
        self.s = struct.calcsize(indexformat)
        self.indexformat = indexformat
        self.datasize = size
        self.l = size/self.s
        self.index = [None] * self.l
        self.map = {nullid: nullrev}
        self.allmap = 0
        self.all = 0
        self.mapfind_count = 0
        self.shaoffset = shaoffset

    def loadmap(self):
        """
        during a commit, we need to make sure the rev being added is
        not a duplicate.  This requires loading the entire index,
        which is fairly slow.  loadmap can load up just the node map,
        which takes much less time.
        """
        if self.allmap: return
        end = self.datasize
        self.allmap = 1
        cur = 0
        count = 0
        blocksize = self.s * 256
        self.dataf.seek(0)
        while cur < end:
            data = self.dataf.read(blocksize)
            off = 0
            for x in xrange(256):
                n = data[off + self.shaoffset:off + self.shaoffset + 20]
                self.map[n] = count
                count += 1
                if count >= self.l:
                    break
                off += self.s
            cur += blocksize

    def loadblock(self, blockstart, blocksize, data=None):
        if self.all: return
        if data is None:
            self.dataf.seek(blockstart)
            if blockstart + blocksize > self.datasize:
                # the revlog may have grown since we've started running,
                # but we don't have space in self.index for more entries.
                # limit blocksize so that we don't get too much data.
                blocksize = max(self.datasize - blockstart, 0)
            data = self.dataf.read(blocksize)
        lend = len(data) / self.s
        i = blockstart / self.s
        off = 0
        # lazyindex supports __delitem__
        if lend > len(self.index) - i:
            lend = len(self.index) - i
        for x in xrange(lend):
            if self.index[i + x] == None:
                b = data[off : off + self.s]
                self.index[i + x] = b
                n = b[self.shaoffset:self.shaoffset + 20]
                self.map[n] = i + x
            off += self.s

    def findnode(self, node):
        """search backwards through the index file for a specific node"""
        if self.allmap: return None

        # hg log will cause many many searches for the manifest
        # nodes.  After we get called a few times, just load the whole
        # thing.
        if self.mapfind_count > 8:
            self.loadmap()
            if node in self.map:
                return node
            return None
        self.mapfind_count += 1
        last = self.l - 1
        while self.index[last] != None:
            if last == 0:
                self.all = 1
                self.allmap = 1
                return None
            last -= 1
        end = (last + 1) * self.s
        blocksize = self.s * 256
        while end >= 0:
            start = max(end - blocksize, 0)
            self.dataf.seek(start)
            data = self.dataf.read(end - start)
            findend = end - start
            while True:
                # we're searching backwards, so we have to make sure
                # we don't find a changeset where this node is a parent
                off = data.rfind(node, 0, findend)
                findend = off
                if off >= 0:
                    i = off / self.s
                    off = i * self.s
                    n = data[off + self.shaoffset:off + self.shaoffset + 20]
                    if n == node:
                        self.map[n] = i + start / self.s
                        return node
                else:
                    break
            end -= blocksize
        return None

    def loadindex(self, i=None, end=None):
        if self.all: return
        all = False
        if i == None:
            blockstart = 0
            blocksize = (512 / self.s) * self.s
            end = self.datasize
            all = True
        else:
            if end:
                blockstart = i * self.s
                end = end * self.s
                blocksize = end - blockstart
            else:
                blockstart = (i & ~(32)) * self.s
                blocksize = self.s * 64
                end = blockstart + blocksize
        while blockstart < end:
            self.loadblock(blockstart, blocksize)
            blockstart += blocksize
        if all: self.all = True

class lazyindex(object):
    """a lazy version of the index array"""
    def __init__(self, parser):
        self.p = parser
    def __len__(self):
        return len(self.p.index)
    def load(self, pos):
        if pos < 0:
            pos += len(self.p.index)
        self.p.loadindex(pos)
        return self.p.index[pos]
    def __getitem__(self, pos):
        ret = self.p.index[pos] or self.load(pos)
        if isinstance(ret, str):
            ret = struct.unpack(self.p.indexformat, ret)
        return ret
    def __setitem__(self, pos, item):
        self.p.index[pos] = item
    def __delitem__(self, pos):
        del self.p.index[pos]
    def append(self, e):
        self.p.index.append(e)

class lazymap(object):
    """a lazy version of the node map"""
    def __init__(self, parser):
        self.p = parser
    def load(self, key):
        n = self.p.findnode(key)
        if n == None:
            raise KeyError(key)
    def __contains__(self, key):
        if key in self.p.map:
            return True
        self.p.loadmap()
        return key in self.p.map
    def __iter__(self):
        yield nullid
        for i in xrange(self.p.l):
            ret = self.p.index[i]
            if not ret:
                self.p.loadindex(i)
                ret = self.p.index[i]
            if isinstance(ret, str):
                ret = struct.unpack(self.p.indexformat, ret)
            yield ret[-1]
    def __getitem__(self, key):
        try:
            return self.p.map[key]
        except KeyError:
            try:
                self.load(key)
                return self.p.map[key]
            except KeyError:
                raise KeyError("node " + hex(key))
    def __setitem__(self, key, val):
        self.p.map[key] = val
    def __delitem__(self, key):
        del self.p.map[key]

class RevlogError(Exception): pass
class LookupError(RevlogError): pass

class revlog(object):
    """
    the underlying revision storage object

    A revlog consists of two parts, an index and the revision data.

    The index is a file with a fixed record size containing
    information on each revision, including its nodeid (hash), the
    nodeids of its parents, the position and offset of its data within
    the data file, and the revision it's based on. Finally, each entry
    contains a linkrev entry that can serve as a pointer to external
    data.

    The revision data itself is a linear collection of data chunks.
    Each chunk represents a revision and is usually represented as a
    delta against the previous chunk. To bound lookup time, runs of
    deltas are limited to about 2 times the length of the original
    version data. This makes retrieval of a version proportional to
    its size, or O(1) relative to the number of revisions.

    Both pieces of the revlog are written to in an append-only
    fashion, which means we never need to rewrite a file to insert or
    remove data, and can use some simple techniques to avoid the need
    for locking while reading.
    """
    def __init__(self, opener, indexfile):
        """
        create a revlog object

        opener is a function that abstracts the file opening operation
        and can be used to implement COW semantics or the like.
        """
        self.indexfile = indexfile
        self.datafile = indexfile[:-2] + ".d"
        self.opener = opener

        self.indexstat = None
        self.cache = None
        self.chunkcache = None
-        self.defversion=REVLOG_DEFAULT_VERSION
+        self.defversion = REVLOG_DEFAULT_VERSION
        if hasattr(opener, "defversion"):
            self.defversion = opener.defversion
        self.load()

    def load(self):
        v = self.defversion
        try:
            f = self.opener(self.indexfile)
            i = f.read(4)
            f.seek(0)
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            i = ""
        else:
            try:
                st = util.fstat(f)
            except AttributeError, inst:
                st = None
            else:
                oldst = self.indexstat
                if (oldst and st.st_dev == oldst.st_dev
                    and st.st_ino == oldst.st_ino
                    and st.st_mtime == oldst.st_mtime
                    and st.st_ctime == oldst.st_ctime):
                    return
                self.indexstat = st
            if len(i) > 0:
                v = struct.unpack(versionformat, i)[0]
        flags = v & ~0xFFFF
        fmt = v & 0xFFFF
        if fmt == REVLOGV0:
            if flags:
                raise RevlogError(_("index %s unknown flags %#04x for format v0")
                                  % (self.indexfile, flags >> 16))
        elif fmt == REVLOGNG:
            if flags & ~REVLOGNGINLINEDATA:
                raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                                  % (self.indexfile, flags >> 16))
        else:
            raise RevlogError(_("index %s unknown format %d")
                              % (self.indexfile, fmt))
        self.version = v
        if v == REVLOGV0:
            self.indexformat = indexformatv0
            shaoffset = v0shaoffset
        else:
            self.indexformat = indexformatng
            shaoffset = ngshaoffset

        if i:
            if (lazyparser.safe_to_use and not self.inlinedata() and
                st and st.st_size > 10000):
                # big index, let's parse it on demand
                parser = lazyparser(f, st.st_size, self.indexformat, shaoffset)
                self.index = lazyindex(parser)
                self.nodemap = lazymap(parser)
            else:
                self.parseindex(f, st)
            if self.version != REVLOGV0:
                e = list(self.index[0])
                type = self.ngtype(e[0])
                e[0] = self.offset_type(0, type)
                self.index[0] = e
        else:
            self.nodemap = {nullid: nullrev}
            self.index = []


    def parseindex(self, fp, st):
        s = struct.calcsize(self.indexformat)
        self.index = []
        self.nodemap = {nullid: nullrev}
        inline = self.inlinedata()
        n = 0
        leftover = None
        while True:
            if st:
                data = fp.read(65536)
            else:
                # hack for httprangereader, it doesn't do partial reads well
                data = fp.read()
            if not data:
                break
            if n == 0 and self.inlinedata():
                # cache the first chunk
                self.chunkcache = (0, data)
            if leftover:
                data = leftover + data
                leftover = None
            off = 0
            l = len(data)
            while off < l:
                if l - off < s:
                    leftover = data[off:]
                    break
                cur = data[off:off + s]
                off += s
                e = struct.unpack(self.indexformat, cur)
                self.index.append(e)
                self.nodemap[e[-1]] = n
                n += 1
                if inline:
                    if e[1] < 0:
                        break
                    off += e[1]
                    if off > l:
                        # some things don't seek well, just read it
                        fp.read(off - l)
                        break
            if not st:
                break


    def ngoffset(self, q):
        if q & 0xFFFF:
            raise RevlogError(_('%s: incompatible revision flag %x') %
                              (self.indexfile, q))
        return long(q >> 16)

    def ngtype(self, q):
        return int(q & 0xFFFF)

    def offset_type(self, offset, type):
        return long(long(offset) << 16 | type)

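    # Editor's sketch, not part of revlog.py: an NG index entry's first
    # field packs the data offset into the high 48 bits and a 16-bit
    # type/flag value into the low bits; ngtype() and ngoffset() just
    # unpack it again (ngoffset() also insists the low 16 bits are clear):
    #
    #     q = long(12345) << 16 | 0    # what offset_type(12345, 0) builds
    #     int(q & 0xFFFF)              # -> 0, what ngtype(q) returns
    #     long(q >> 16)                # -> 12345, what ngoffset(q) returns
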
    def loadindex(self, start, end):
        """load a block of indexes all at once from the lazy parser"""
        if isinstance(self.index, lazyindex):
            self.index.p.loadindex(start, end)

    def loadindexmap(self):
        """loads both the map and the index from the lazy parser"""
        if isinstance(self.index, lazyindex):
            p = self.index.p
            p.loadindex()
            self.nodemap = p.map

    def loadmap(self):
        """loads the map from the lazy parser"""
        if isinstance(self.nodemap, lazymap):
            self.nodemap.p.loadmap()
            self.nodemap = self.nodemap.p.map

    def inlinedata(self): return self.version & REVLOGNGINLINEDATA
    def tip(self): return self.node(len(self.index) - 1)
    def count(self): return len(self.index)
    def node(self, rev):
        return rev == nullrev and nullid or self.index[rev][-1]
    def rev(self, node):
        try:
            return self.nodemap[node]
        except KeyError:
            raise LookupError(_('%s: no node %s') % (self.indexfile, hex(node)))
    def linkrev(self, node):
        return (node == nullid) and nullrev or self.index[self.rev(node)][-4]
    def parents(self, node):
        if node == nullid: return (nullid, nullid)
        r = self.rev(node)
        d = self.index[r][-3:-1]
        if self.version == REVLOGV0:
            return d
        return (self.node(d[0]), self.node(d[1]))
    def parentrevs(self, rev):
        if rev == nullrev:
            return (nullrev, nullrev)
        d = self.index[rev][-3:-1]
        if self.version == REVLOGV0:
            return (self.rev(d[0]), self.rev(d[1]))
        return d
    def start(self, rev):
        if rev == nullrev:
            return 0
        if self.version != REVLOGV0:
            return self.ngoffset(self.index[rev][0])
        return self.index[rev][0]

    def end(self, rev): return self.start(rev) + self.length(rev)

    def size(self, rev):
        """return the length of the uncompressed text for a given revision"""
        if rev == nullrev:
            return 0
        l = -1
        if self.version != REVLOGV0:
            l = self.index[rev][2]
        if l >= 0:
            return l

        t = self.revision(self.node(rev))
        return len(t)

        # alternate implementation. The advantage of this code is that
        # it will be faster for a single revision. But, the results are
        # not cached, so finding the size of every revision will be slower.
        """
        if self.cache and self.cache[1] == rev:
            return len(self.cache[2])

        base = self.base(rev)
        if self.cache and self.cache[1] >= base and self.cache[1] < rev:
            base = self.cache[1]
            text = self.cache[2]
        else:
            text = self.revision(self.node(base))

        l = len(text)
        for x in xrange(base + 1, rev + 1):
            l = mdiff.patchedsize(l, self.chunk(x))
        return l
        """

    def length(self, rev):
        if rev == nullrev:
            return 0
        else:
            return self.index[rev][1]
    def base(self, rev):
        if (rev == nullrev):
            return nullrev
        else:
            return self.index[rev][-5]

    def reachable(self, node, stop=None):
        """return a hash of all nodes ancestral to a given node, including
        the node itself, stopping when stop is matched"""
        reachable = {}
        visit = [node]
        reachable[node] = 1
        if stop:
            stopn = self.rev(stop)
        else:
            stopn = 0
        while visit:
            n = visit.pop(0)
            if n == stop:
                continue
            if n == nullid:
                continue
            for p in self.parents(n):
                if self.rev(p) < stopn:
                    continue
                if p not in reachable:
                    reachable[p] = 1
                    visit.append(p)
        return reachable

    def nodesbetween(self, roots=None, heads=None):
        """Return a tuple containing three elements. Elements 1 and 2 contain
        a final list of bases and heads after all the unreachable ones have
        been pruned. Element 0 contains a topologically sorted list of all

        nodes that satisfy these constraints:
        1. All nodes must be descended from a node in roots (the nodes on
           roots are considered descended from themselves).
        2. All nodes must also be ancestors of a node in heads (the nodes in
           heads are considered to be their own ancestors).

        If roots is unspecified, nullid is assumed as the only root.
        If heads is unspecified, it is taken to be the output of the
        heads method (i.e. a list of all nodes in the repository that
        have no children)."""
        nonodes = ([], [], [])
        if roots is not None:
            roots = list(roots)
            if not roots:
                return nonodes
            lowestrev = min([self.rev(n) for n in roots])
        else:
            roots = [nullid] # Everybody's a descendent of nullid
            lowestrev = nullrev
        if (lowestrev == nullrev) and (heads is None):
            # We want _all_ the nodes!
            return ([self.node(r) for r in xrange(0, self.count())],
                    [nullid], list(self.heads()))
        if heads is None:
            # All nodes are ancestors, so the latest ancestor is the last
            # node.
            highestrev = self.count() - 1
            # Set ancestors to None to signal that every node is an ancestor.
            ancestors = None
            # Set heads to an empty dictionary for later discovery of heads
            heads = {}
        else:
            heads = list(heads)
            if not heads:
                return nonodes
            ancestors = {}
            # Turn heads into a dictionary so we can remove 'fake' heads.
            # Also, later we will be using it to filter out the heads we can't
            # find from roots.
            heads = dict.fromkeys(heads, 0)
            # Start at the top and keep marking parents until we're done.
            nodestotag = heads.keys()
            # Remember where the top was so we can use it as a limit later.
            highestrev = max([self.rev(n) for n in nodestotag])
            while nodestotag:
                # grab a node to tag
                n = nodestotag.pop()
                # Never tag nullid
                if n == nullid:
                    continue
                # A node's revision number represents its place in a
                # topologically sorted list of nodes.
                r = self.rev(n)
                if r >= lowestrev:
                    if n not in ancestors:
                        # If we are possibly a descendent of one of the roots
                        # and we haven't already been marked as an ancestor
                        ancestors[n] = 1 # Mark as ancestor
                        # Add non-nullid parents to list of nodes to tag.
                        nodestotag.extend([p for p in self.parents(n) if
                                           p != nullid])
                    elif n in heads: # We've seen it before, is it a fake head?
                        # So it is, real heads should not be the ancestors of
                        # any other heads.
                        heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots? Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a 'set' (i.e. a dictionary where the
        # values don't matter).
        descendents = dict.fromkeys(roots, 1)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendents.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendents, empty parents will look like
        # they're descendents.
        for r in xrange(max(lowestrev, 0), highestrev + 1):
            n = self.node(r)
            isdescendent = False
            if lowestrev == nullrev:  # Everybody is a descendent of nullid
                isdescendent = True
            elif n in descendents:
                # n is already a descendent
                isdescendent = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendents before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendents, it's not a root.
                    if (p[0] in descendents) or (p[1] in descendents):
                        roots.pop(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendent if either of its parents are
                # descendents. (We seeded the dependents list with the roots
                # up there, remember?)
                if (p[0] in descendents) or (p[1] in descendents):
                    descendents[n] = 1
                    isdescendent = True
            if isdescendent and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendents and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = 1
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = 1
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n in heads.iterkeys() if heads[n] != 0]
        roots = roots.keys()
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = dict.fromkeys([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = {startrev: 1}
        heads = {startrev: 1}

        parentrevs = self.parentrevs
        for r in xrange(startrev + 1, self.count()):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable[r] = 1
                        heads[r] = 1
                    if p in heads and p not in stoprevs:
                        del heads[p]

        return [self.node(r) for r in heads]

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in range(p + 1, self.count()):
            for pr in self.parentrevs(r):
                if pr == p:
                    c.append(self.node(r))
        return c

    def _match(self, id):
        if isinstance(id, (long, int)):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                r = self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if str(rev) != id: raise ValueError
            if rev < 0: rev = self.count() + rev
            if rev < 0 or rev >= self.count(): raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                r = self.rev(node)
                return node
            except TypeError:
                pass

    def _partialmatch(self, id):
        if len(id) < 40:
            try:
                # hex(node)[:...]
                bin_id = bin(id[:len(id) & ~1]) # grab an even number of digits
                node = None
                for n in self.nodemap:
                    if n.startswith(bin_id) and hex(n).startswith(id):
                        if node is not None:
                            raise LookupError(_("Ambiguous identifier"))
                        node = n
                if node is not None:
                    return node
            except TypeError:
                pass

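    # Editor's sketch, not part of revlog.py: a short hex id is truncated
    # to an even number of digits so bin() can convert it for a fast binary
    # startswith() test; the full hex comparison then settles an odd digit:
    #
    #     id = "0ce2325"               # 7 digits
    #     id[:len(id) & ~1]            # -> "0ce232", safe to pass to bin()
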
    def lookup(self, id):
        """locate a node based on:
            - revision number or str(revision number)
            - nodeid or subset of hex nodeid
        """

        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(_("No match found"))

    def cmp(self, node, text):
        """compare text with a given file revision"""
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def makenode(self, node, text):
        """calculate a file nodeid for text, descended or possibly
        unchanged from node"""

        if self.cmp(node, text):
            return hash(text, node, nullid)
        return node

    def diff(self, a, b):
        """return a delta between two revisions"""
        return mdiff.textdiff(a, b)

    def patches(self, t, pl):
        """apply a list of patches to a string"""
        return mdiff.patches(t, pl)

    def chunk(self, rev, df=None, cachelen=4096):
        start, length = self.start(rev), self.length(rev)
        inline = self.inlinedata()
        if inline:
            start += (rev + 1) * struct.calcsize(self.indexformat)
        end = start + length
        def loadcache(df):
            cache_length = max(cachelen, length) # 4k
            if not df:
                if inline:
                    df = self.opener(self.indexfile)
                else:
                    df = self.opener(self.datafile)
            df.seek(start)
            self.chunkcache = (start, df.read(cache_length))

        if not self.chunkcache:
            loadcache(df)

        cache_start = self.chunkcache[0]
        cache_end = cache_start + len(self.chunkcache[1])
        if start >= cache_start and end <= cache_end:
            # it is cached
            offset = start - cache_start
        else:
            loadcache(df)
            offset = 0

        #def checkchunk():
        #    df = self.opener(self.datafile)
        #    df.seek(start)
        #    return df.read(length)
        #assert s == checkchunk()
        return decompress(self.chunkcache[1][offset:offset + length])

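    # Editor's sketch, not part of revlog.py: with inline data the chunks
    # live in the .i file itself, interleaved after each index record, so
    # revision rev's data starts (rev + 1) records past its nominal offset:
    #
    #     struct.calcsize(indexformatng)   # -> 64 bytes per record
    #     100 + (2 + 1) * 64               # -> 292, start for rev 2 whose
    #                                      #    nominal data offset is 100
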
    def delta(self, node):
        """return or calculate a delta between a node and its predecessor"""
        r = self.rev(node)
        return self.revdiff(r - 1, r)

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        b1 = self.base(rev1)
        b2 = self.base(rev2)
        if b1 == b2 and rev1 + 1 == rev2:
            return self.chunk(rev2)
        else:
            return self.diff(self.revision(self.node(rev1)),
                             self.revision(self.node(rev2)))

    def revision(self, node):
        """return an uncompressed revision of a given node"""
        if node == nullid: return ""
        if self.cache and self.cache[0] == node: return self.cache[2]

        # look up what we need to read
        text = None
        rev = self.rev(node)
        base = self.base(rev)

        if self.inlinedata():
            # we probably have the whole chunk cached
            df = None
        else:
            df = self.opener(self.datafile)

        # do we have useful data cached?
        if self.cache and self.cache[1] >= base and self.cache[1] < rev:
            base = self.cache[1]
            text = self.cache[2]
            self.loadindex(base, rev + 1)
        else:
            self.loadindex(base, rev + 1)
            text = self.chunk(base, df=df)

        bins = []
        for r in xrange(base + 1, rev + 1):
            bins.append(self.chunk(r, df=df))

        text = self.patches(text, bins)

        p1, p2 = self.parents(node)
        if node != hash(text, p1, p2):
            raise RevlogError(_("integrity check failed on %s:%d")
                              % (self.datafile, rev))

        self.cache = (node, rev, text)
        return text

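    # Editor's sketch, not part of revlog.py: revision() above rebuilds a
    # text from the full snapshot at base(rev) plus every delta up to rev,
    # then verifies it against the nodeid, e.g. for base 3 and rev 6:
    #
    #     text = chunk(3)                     # full text stored at the base
    #     text = patches(text, [chunk(4), chunk(5), chunk(6)])
    #     node == hash(text, p1, p2)          # integrity check before caching
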
    def checkinlinesize(self, tr, fp=None):
        if not self.inlinedata():
            return
        if not fp:
            fp = self.opener(self.indexfile, 'r')
        fp.seek(0, 2)
        size = fp.tell()
        if size < 131072:  # keep revlogs inline until they grow past 128k
            return
        trinfo = tr.find(self.indexfile)
        if trinfo is None:
            raise RevlogError(_("%s not found in the transaction")
                              % self.indexfile)

        trindex = trinfo[2]
        dataoff = self.start(trindex)

        tr.add(self.datafile, dataoff)
        df = self.opener(self.datafile, 'w')
        calc = struct.calcsize(self.indexformat)
        for r in xrange(self.count()):
            start = self.start(r) + (r + 1) * calc
            length = self.length(r)
            fp.seek(start)
            d = fp.read(length)
            df.write(d)
        fp.close()
        df.close()
        fp = self.opener(self.indexfile, 'w', atomictemp=True)
        self.version &= ~(REVLOGNGINLINEDATA)
        if self.count():
            x = self.index[0]
            e = struct.pack(self.indexformat, *x)[4:]
            l = struct.pack(versionformat, self.version)
            fp.write(l)
            fp.write(e)

        for i in xrange(1, self.count()):
            x = self.index[i]
            e = struct.pack(self.indexformat, *x)
            fp.write(e)

        # if we don't call rename, the temp file will never replace the
        # real index
        fp.rename()

        tr.replace(self.indexfile, trindex * calc)
        self.chunkcache = None

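    # Layout note (illustrative, derived from the copy loop above): in an
    # inline revlog, the data chunk for revision r immediately follows its
    # index entry, so the file interleaves entries and data:
    #
    #   entry 0 | data 0 | entry 1 | data 1 | ... | entry r | data r
    #
    # Revision r's data is therefore preceded by r + 1 index entries and
    # start(r) data bytes, which is the start(r) + (r + 1) * calc offset
    # used when splitting the data out into a separate file.
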
    def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        d - an optional precomputed delta
        """
        if not self.inlinedata():
            dfh = self.opener(self.datafile, "a")
        else:
            dfh = None
        ifh = self.opener(self.indexfile, "a+")
        return self._addrevision(text, transaction, link, p1, p2, d, ifh, dfh)

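    # Usage sketch (hypothetical caller): appending one revision inside a
    # transaction; `rl`, `tr` and `linkrev` are assumed to be supplied by
    # the surrounding repository code, not by this module:
    #
    #   node = rl.addrevision("new file text\n", tr, linkrev,
    #                         p1=rl.tip(), p2=nullid)
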
    def _addrevision(self, text, transaction, link, p1, p2, d, ifh, dfh):
        if text is None: text = ""
        if p1 is None: p1 = self.tip()
        if p2 is None: p2 = nullid

        node = hash(text, p1, p2)

        if node in self.nodemap:
            return node

        n = self.count()
        t = n - 1

        if n:
            base = self.base(t)
            start = self.start(base)
            end = self.end(t)
            if not d:
                prev = self.revision(self.tip())
                d = self.diff(prev, text)
            data = compress(d)
            l = len(data[1]) + len(data[0])
            dist = end - start + l

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if not n or dist > len(text) * 2:
            data = compress(text)
            l = len(data[1]) + len(data[0])
            base = n
        else:
            base = self.base(t)

        offset = 0
        if t >= 0:
            offset = self.end(t)

        if self.version == REVLOGV0:
            e = (offset, l, base, link, p1, p2, node)
        else:
            e = (self.offset_type(offset, 0), l, len(text),
                 base, link, self.rev(p1), self.rev(p2), node)

        self.index.append(e)
        self.nodemap[node] = n
        entry = struct.pack(self.indexformat, *e)

        if not self.inlinedata():
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, n * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            dfh.flush()
        else:
            ifh.seek(0, 2)
            transaction.add(self.indexfile, ifh.tell(), self.count() - 1)

        if len(self.index) == 1 and self.version != REVLOGV0:
            l = struct.pack(versionformat, self.version)
            ifh.write(l)
            entry = entry[4:]

        ifh.write(entry)

        if self.inlinedata():
            ifh.write(data[0])
            ifh.write(data[1])
            self.checkinlinesize(transaction, ifh)

        self.cache = (node, n, text)
        return node

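    # Worked example of the heuristic above (numbers are illustrative): if
    # the current delta chain spans end - start = 9000 bytes and the new
    # compressed delta adds l = 600, then dist = 9600.  For a full text of
    # 4000 bytes, 9600 > 2 * 4000, so a fresh full version is stored and
    # the delta chain restarts at this revision.
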
    def ancestor(self, a, b):
        """calculate the least common ancestor of nodes a and b"""

        def parents(rev):
            return [p for p in self.parentrevs(rev) if p != nullrev]

        c = ancestor.ancestor(self.rev(a), self.rev(b), parents)
        if c is None:
            return nullid

        return self.node(c)

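    # Illustrative case: for a history where rev 0 is the root, rev 2
    # descends from it via rev 1, and rev 3 is a second child of rev 0,
    # rl.ancestor(rl.node(2), rl.node(3)) returns rl.node(0); two nodes
    # with no common ancestor yield nullid.
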
    def group(self, nodelist, lookup, infocollect=None):
        """calculate a delta group

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes.  The first delta is
        parent(nodes[0]) -> nodes[0]; the receiver is guaranteed to
        have this parent, as it has all history before these
        changesets.  The parent sent is always parent[0].
        """
        revs = [self.rev(n) for n in nodelist]

        # if we don't have any revisions touched by these changesets, bail
        if not revs:
            yield changegroup.closechunk()
            return

        # add the parent of the first rev
        p = self.parents(self.node(revs[0]))[0]
        revs.insert(0, self.rev(p))

        # build deltas
        for d in xrange(0, len(revs) - 1):
            a, b = revs[d], revs[d + 1]
            nb = self.node(b)

            if infocollect is not None:
                infocollect(nb)

            d = self.revdiff(a, b)
            p = self.parents(nb)
            meta = nb + p[0] + p[1] + lookup(nb)
            yield changegroup.genchunk("%s%s" % (meta, d))

        yield changegroup.closechunk()

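    # Chunk format sketch (as consumed by addgroup below): each delta chunk
    # carries an 80-byte header of four 20-byte binary nodes followed by
    # the delta payload:
    #
    #   +--------+--------+--------+--------+---------------+
    #   |  node  |   p1   |   p2   |   cs   |  delta bytes  |
    #   +--------+--------+--------+--------+---------------+
    #
    # The receiver recovers the header with
    # struct.unpack("20s20s20s20s", chunk[:80]).
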
    def addgroup(self, revs, linkmapper, transaction, unique=0):
        """
        add a delta group

        Given a set of deltas, add them to the revision log.  The
        first delta is against its parent, which should already be
        in our log; the rest are each against the previous delta.
        """

        # track the base of the current delta log
        r = self.count()
        t = r - 1
        node = None

        base = prev = nullrev
        start = end = textlen = 0
        if r:
            end = self.end(t)

        ifh = self.opener(self.indexfile, "a+")
        ifh.seek(0, 2)
        transaction.add(self.indexfile, ifh.tell(), self.count())
        if self.inlinedata():
            dfh = None
        else:
            transaction.add(self.datafile, end)
            dfh = self.opener(self.datafile, "a")

        # loop through our set of deltas
        chain = None
        for chunk in revs:
            node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
            link = linkmapper(cs)
            if node in self.nodemap:
                # this can happen if two branches make the same change
                # if unique:
                #    raise RevlogError(_("already have %s") % hex(node[:4]))
                chain = node
                continue
            delta = chunk[80:]

            for p in (p1, p2):
                if p not in self.nodemap:
                    raise LookupError(_("unknown parent %s") % short(p))

            if not chain:
                # retrieve the parent revision of the delta chain
                chain = p1
                if chain not in self.nodemap:
                    raise LookupError(_("unknown base %s") % short(chain))

            # full versions are inserted when the needed deltas become
            # comparable to the uncompressed text or when the previous
            # version is not the one we have a delta against. We use
            # the size of the previous full rev as a proxy for the
            # current size.

            if chain == prev:
                tempd = compress(delta)
                cdelta = tempd[0] + tempd[1]
                textlen = mdiff.patchedsize(textlen, delta)

            if chain != prev or (end - start + len(cdelta)) > textlen * 2:
                # flush our writes here so we can read it in revision
                if dfh:
                    dfh.flush()
                ifh.flush()
                text = self.revision(chain)
                text = self.patches(text, [delta])
                chk = self._addrevision(text, transaction, link, p1, p2, None,
                                        ifh, dfh)
                if not dfh and not self.inlinedata():
                    # addrevision switched from inline to conventional
                    # reopen the index
                    dfh = self.opener(self.datafile, "a")
                    ifh = self.opener(self.indexfile, "a")
                if chk != node:
                    raise RevlogError(_("consistency error adding group"))
                textlen = len(text)
            else:
                if self.version == REVLOGV0:
                    e = (end, len(cdelta), base, link, p1, p2, node)
                else:
                    e = (self.offset_type(end, 0), len(cdelta), textlen, base,
                         link, self.rev(p1), self.rev(p2), node)
                self.index.append(e)
                self.nodemap[node] = r
                if self.inlinedata():
                    ifh.write(struct.pack(self.indexformat, *e))
                    ifh.write(cdelta)
                    self.checkinlinesize(transaction, ifh)
                    if not self.inlinedata():
                        dfh = self.opener(self.datafile, "a")
                        ifh = self.opener(self.indexfile, "a")
                else:
                    dfh.write(cdelta)
                    ifh.write(struct.pack(self.indexformat, *e))

            t, r, chain, prev = r, r + 1, node, node
            base = self.base(t)
            start = self.start(base)
            end = self.end(t)

        return node

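    # Round-trip sketch (hedged; the exact plumbing lives in the caller):
    # the chunks yielded by group() above can be fed back into addgroup()
    # on the receiving side.  Here `chunks` is assumed to iterate decoded
    # delta chunks (without the length framing added by genchunk) and `cl`
    # an already-synced changelog providing the linkrev mapping:
    #
    #   rl.addgroup(chunks, lambda cs: cl.rev(cs), transaction)
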
    def strip(self, rev, minlink):
        if self.count() == 0 or rev >= self.count():
            return

        if isinstance(self.index, lazyindex):
            self.loadindexmap()

        # When stripping away a revision, we need to make sure it
        # does not actually belong to an older changeset.
        # The minlink parameter defines the oldest revision
        # we're allowed to strip away.
        while minlink > self.index[rev][-4]:  # index[rev][-4] is the linkrev
            rev += 1
            if rev >= self.count():
                return

        # first truncate the files on disk
        end = self.start(rev)
        if not self.inlinedata():
            df = self.opener(self.datafile, "a")
            df.truncate(end)
            end = rev * struct.calcsize(self.indexformat)
        else:
            end += rev * struct.calcsize(self.indexformat)

        indexf = self.opener(self.indexfile, "a")
        indexf.truncate(end)

        # then reset internal state in memory to forget those revisions
        self.cache = None
        self.chunkcache = None
        for x in xrange(rev, self.count()):
            del self.nodemap[self.node(x)]

        del self.index[rev:]

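    # Truncation sketch matching the branches above: a non-inline revlog
    # cuts the data file at start(rev) and the index at rev * entrysize;
    # an inline revlog cuts a single file at start(rev) + rev * entrysize,
    # since entry r is preceded by r index entries and start(r) data bytes.
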
    def checksize(self):
        expected = 0
        if self.count():
            expected = self.end(self.count() - 1)

        try:
            f = self.opener(self.datafile)
            f.seek(0, 2)
            actual = f.tell()
            dd = actual - expected
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            s = struct.calcsize(self.indexformat)
            i = actual / s
            di = actual - (i * s)
            if self.inlinedata():
                databytes = 0
                for r in xrange(self.count()):
                    databytes += self.length(r)
                dd = 0
                di = actual - self.count() * s - databytes
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)

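    # Usage sketch (hedged; `rl` is an assumed open revlog): nonzero dd or
    # di mean surplus or missing bytes in the data and index files
    # respectively, so a verify-style caller might do:
    #
    #   dd, di = rl.checksize()
    #   if dd or di:
    #       print "size mismatch: %d data, %d index bytes" % (dd, di)
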