revlog: eliminate diff and patches functions
Matt Mackall
r4989:1aaed3d6 default
@@ -1,251 +1,250 @@
 """
 bundlerepo.py - repository class for viewing uncompressed bundles

 This provides a read-only repository interface to bundles as if
 they were part of the actual repository.

 Copyright 2006, 2007 Benoit Boissinot <bboissin@gmail.com>

 This software may be used and distributed according to the terms
 of the GNU General Public License, incorporated herein by reference.
 """

 from node import *
 from i18n import _
-import changegroup, util, os, struct, bz2, tempfile
-
+import changegroup, util, os, struct, bz2, tempfile, mdiff
 import localrepo, changelog, manifest, filelog, revlog

 class bundlerevlog(revlog.revlog):
     def __init__(self, opener, indexfile, bundlefile,
                  linkmapper=None):
         # How it works:
         # to retrieve a revision, we need to know the offset of
         # the revision in the bundlefile (an opened file).
         #
         # We store this offset in the index (start). To differentiate a
         # rev in the bundle from a rev in the revlog, we check
         # len(index[r]). If the tuple is bigger than 7, it is a bundle
         # (it is bigger since we store the node to which the delta is)
         #
         revlog.revlog.__init__(self, opener, indexfile)
         self.bundlefile = bundlefile
         self.basemap = {}
         def chunkpositer():
             for chunk in changegroup.chunkiter(bundlefile):
                 pos = bundlefile.tell()
                 yield chunk, pos - len(chunk)
         n = self.count()
         prev = None
         for chunk, start in chunkpositer():
             size = len(chunk)
             if size < 80:
                 raise util.Abort("invalid changegroup")
             start += 80
             size -= 80
             node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
             if node in self.nodemap:
                 prev = node
                 continue
             for p in (p1, p2):
                 if not p in self.nodemap:
                     raise revlog.LookupError(_("unknown parent %s") % short(p1))
             if linkmapper is None:
                 link = n
             else:
                 link = linkmapper(cs)

             if not prev:
                 prev = p1
             # start, size, base is not used, link, p1, p2, delta ref
             e = (revlog.offset_type(start, 0), size, -1, None, link,
                  self.rev(p1), self.rev(p2), node)
             self.basemap[n] = prev
             self.index.insert(-1, e)
             self.nodemap[node] = n
             prev = node
             n += 1

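chunkpositer above leans on changegroup.chunkiter, which yields length-prefixed chunks. A minimal reader sketch, assuming the HG10 framing (a 4-byte big-endian length that counts itself, with a length of 4 or less terminating the group; iter_chunks is an illustrative helper, not part of Mercurial):

    import struct

    def iter_chunks(fp):
        # Assumed HG10 changegroup framing: each chunk starts with a
        # 4-byte big-endian length that includes the length field
        # itself; an empty chunk (length <= 4) ends the group.
        while True:
            header = fp.read(4)
            if len(header) < 4:
                break
            l = struct.unpack(">l", header)[0]
            if l <= 4:
                break
            yield fp.read(l - 4)

Each revision chunk then begins with the 80-byte header the constructor unpacks: node, p1, p2 and the changeset link.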
     def bundle(self, rev):
         """is rev from the bundle"""
         if rev < 0:
             return False
         return rev in self.basemap
     def bundlebase(self, rev): return self.basemap[rev]
     def chunk(self, rev, df=None, cachelen=4096):
         # Warning: in case of bundle, the diff is against bundlebase,
         # not against rev - 1
         # XXX: could use some caching
         if not self.bundle(rev):
             return revlog.revlog.chunk(self, rev, df)
         self.bundlefile.seek(self.start(rev))
         return self.bundlefile.read(self.length(rev))

     def revdiff(self, rev1, rev2):
         """return or calculate a delta between two revisions"""
         if self.bundle(rev1) and self.bundle(rev2):
             # hot path for bundle
             revb = self.rev(self.bundlebase(rev2))
             if revb == rev1:
                 return self.chunk(rev2)
         elif not self.bundle(rev1) and not self.bundle(rev2):
             return revlog.revlog.revdiff(self, rev1, rev2)

-        return self.diff(self.revision(self.node(rev1)),
-                         self.revision(self.node(rev2)))
+        return mdiff.textdiff(self.revision(self.node(rev1)),
+                              self.revision(self.node(rev2)))

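This hunk is the point of the commit: revdiff now calls mdiff.textdiff directly instead of the revlog's own diff wrapper. The working assumption is the usual delta invariant, sketched here (needs a Mercurial checkout on the path; plain byte strings, as in the Python 2 era API):

    from mercurial import mdiff

    old = "a\nb\nc\n"
    new = "a\nx\nc\n"
    delta = mdiff.textdiff(old, new)        # binary delta, old -> new
    assert mdiff.patches(old, [delta]) == new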
     def revision(self, node):
         """return an uncompressed revision of a given node"""
         if node == nullid: return ""

         text = None
         chain = []
         iter_node = node
         rev = self.rev(iter_node)
         # reconstruct the revision if it is from a changegroup
         while self.bundle(rev):
             if self._cache and self._cache[0] == iter_node:
                 text = self._cache[2]
                 break
             chain.append(rev)
             iter_node = self.bundlebase(rev)
             rev = self.rev(iter_node)
         if text is None:
             text = revlog.revlog.revision(self, iter_node)

         while chain:
             delta = self.chunk(chain.pop())
-            text = self.patches(text, [delta])
+            text = mdiff.patches(text, [delta])

         p1, p2 = self.parents(node)
         if node != revlog.hash(text, p1, p2):
             raise revlog.RevlogError(_("integrity check failed on %s:%d")
                                      % (self.datafile, self.rev(node)))

         self._cache = (node, self.rev(node), text)
         return text

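revision() walks basemap back to a revision stored outside the bundle, then replays the deltas one chunk at a time. mdiff.patches also accepts the whole list at once, so an equivalent sketch (assuming the chain has been collected base-first) is:

    from mercurial import mdiff

    def reconstruct(base_text, deltas):
        # mdiff.patches folds a list of binary deltas over the base
        # text in order, so a whole delta chain can be replayed in
        # one call instead of the loop above.
        return mdiff.patches(base_text, deltas)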
     def addrevision(self, text, transaction, link, p1=None, p2=None, d=None):
         raise NotImplementedError
     def addgroup(self, revs, linkmapper, transaction, unique=0):
         raise NotImplementedError
     def strip(self, rev, minlink):
         raise NotImplementedError
     def checksize(self):
         raise NotImplementedError

 class bundlechangelog(bundlerevlog, changelog.changelog):
     def __init__(self, opener, bundlefile):
         changelog.changelog.__init__(self, opener)
         bundlerevlog.__init__(self, opener, self.indexfile, bundlefile)

 class bundlemanifest(bundlerevlog, manifest.manifest):
     def __init__(self, opener, bundlefile, linkmapper):
         manifest.manifest.__init__(self, opener)
         bundlerevlog.__init__(self, opener, self.indexfile, bundlefile,
                               linkmapper)

 class bundlefilelog(bundlerevlog, filelog.filelog):
     def __init__(self, opener, path, bundlefile, linkmapper):
         filelog.filelog.__init__(self, opener, path)
         bundlerevlog.__init__(self, opener, self.indexfile, bundlefile,
                               linkmapper)

 class bundlerepository(localrepo.localrepository):
     def __init__(self, ui, path, bundlename):
         localrepo.localrepository.__init__(self, ui, path)

         self._url = 'bundle:' + bundlename
         if path: self._url += '+' + path

         self.tempfile = None
         self.bundlefile = open(bundlename, "rb")
         header = self.bundlefile.read(6)
         if not header.startswith("HG"):
             raise util.Abort(_("%s: not a Mercurial bundle file") % bundlename)
         elif not header.startswith("HG10"):
             raise util.Abort(_("%s: unknown bundle version") % bundlename)
         elif header == "HG10BZ":
             fdtemp, temp = tempfile.mkstemp(prefix="hg-bundle-",
                                             suffix=".hg10un", dir=self.path)
             self.tempfile = temp
             fptemp = os.fdopen(fdtemp, 'wb')
             def generator(f):
                 zd = bz2.BZ2Decompressor()
                 zd.decompress("BZ")
                 for chunk in f:
                     yield zd.decompress(chunk)
             gen = generator(util.filechunkiter(self.bundlefile, 4096))

             try:
                 fptemp.write("HG10UN")
                 for chunk in gen:
                     fptemp.write(chunk)
             finally:
                 fptemp.close()
                 self.bundlefile.close()

             self.bundlefile = open(self.tempfile, "rb")
             # seek right after the header
             self.bundlefile.seek(6)
         elif header == "HG10UN":
             # nothing to do
             pass
         else:
             raise util.Abort(_("%s: unknown bundle compression type")
                              % bundlename)
         self.changelog = bundlechangelog(self.sopener, self.bundlefile)
         self.manifest = bundlemanifest(self.sopener, self.bundlefile,
                                        self.changelog.rev)
         # dict with the mapping 'filename' -> position in the bundle
         self.bundlefilespos = {}
         while 1:
             f = changegroup.getchunk(self.bundlefile)
             if not f:
                 break
             self.bundlefilespos[f] = self.bundlefile.tell()
             for c in changegroup.chunkiter(self.bundlefile):
                 pass

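The generator above relies on a detail worth spelling out: the six-byte file header "HG10BZ" overlaps the "BZ" magic that starts every bzip2 stream, so after reading the header the decompressor must be primed by feeding "BZ" back in. A standalone sketch of the same trick (the sample payload is fabricated for illustration):

    import bz2

    data = "some changegroup bytes"
    stream = "HG10" + bz2.compress(data)   # bz2 output starts with "BZ"
    assert stream[:6] == "HG10BZ"

    zd = bz2.BZ2Decompressor()
    zd.decompress("BZ")            # re-feed the magic consumed with the header
    assert zd.decompress(stream[6:]) == data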
     def url(self):
         return self._url

     def dev(self):
         return -1

     def file(self, f):
         if f[0] == '/':
             f = f[1:]
         if f in self.bundlefilespos:
             self.bundlefile.seek(self.bundlefilespos[f])
             return bundlefilelog(self.sopener, f, self.bundlefile,
                                  self.changelog.rev)
         else:
             return filelog.filelog(self.sopener, f)

     def close(self):
         """Close assigned bundle file immediately."""
         self.bundlefile.close()

     def __del__(self):
         bundlefile = getattr(self, 'bundlefile', None)
         if bundlefile and not bundlefile.closed:
             bundlefile.close()
         tempfile = getattr(self, 'tempfile', None)
         if tempfile is not None:
             os.unlink(tempfile)

 def instance(ui, path, create):
     if create:
         raise util.Abort(_('cannot create new bundle repository'))
     path = util.drop_scheme('file', path)
     if path.startswith('bundle:'):
         path = util.drop_scheme('bundle', path)
         s = path.split("+", 1)
         if len(s) == 1:
             repopath, bundlename = "", s[0]
         else:
             repopath, bundlename = s
     else:
         repopath, bundlename = '', path
     return bundlerepository(ui, repopath, bundlename)
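instance() is what the repository lookup calls for bundle: URLs; an optional '+' separates the underlying repo path from the bundle file. A small sketch of the split it performs (the paths below are made up):

    # "bundle:/tmp/incoming.hg"           -> repopath "", bundle "/tmp/incoming.hg"
    # "bundle:/srv/repo+/tmp/incoming.hg" -> repopath "/srv/repo", bundle "/tmp/incoming.hg"
    path = "/srv/repo+/tmp/incoming.hg"
    repopath, bundlename = path.split("+", 1)
    assert (repopath, bundlename) == ("/srv/repo", "/tmp/incoming.hg")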
@@ -1,1257 +1,1245 @@
 """
 revlog.py - storage back-end for mercurial

 This provides efficient delta storage with O(1) retrieve and append
 and O(changes) merge between branches

 Copyright 2005-2007 Matt Mackall <mpm@selenic.com>

 This software may be used and distributed according to the terms
 of the GNU General Public License, incorporated herein by reference.
 """

 from node import *
 from i18n import _
 import binascii, changegroup, errno, ancestor, mdiff, os
 import sha, struct, util, zlib

17
18 # revlog flags
18 # revlog flags
19 REVLOGV0 = 0
19 REVLOGV0 = 0
20 REVLOGNG = 1
20 REVLOGNG = 1
21 REVLOGNGINLINEDATA = (1 << 16)
21 REVLOGNGINLINEDATA = (1 << 16)
22 REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
22 REVLOG_DEFAULT_FLAGS = REVLOGNGINLINEDATA
23 REVLOG_DEFAULT_FORMAT = REVLOGNG
23 REVLOG_DEFAULT_FORMAT = REVLOGNG
24 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
24 REVLOG_DEFAULT_VERSION = REVLOG_DEFAULT_FORMAT | REVLOG_DEFAULT_FLAGS
25
25
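For concreteness, the version word packs the format number into the low 16 bits and the flags above them; the values follow directly from the constants above:

    REVLOGNG = 1
    REVLOGNGINLINEDATA = 1 << 16

    v = REVLOGNG | REVLOGNGINLINEDATA
    assert v == 0x10001             # REVLOG_DEFAULT_VERSION
    assert v & 0xFFFF == 1          # format: RevlogNG
    assert v & ~0xFFFF == 0x10000   # flags: inline data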
 class RevlogError(Exception):
     pass
 class LookupError(RevlogError):
     pass

 def getoffset(q):
     if q & 0xFFFF:
         raise RevlogError(_('incompatible revision flag %x') % q)
     return int(q >> 16)

 def gettype(q):
     return int(q & 0xFFFF)

 def offset_type(offset, type):
     return long(long(offset) << 16 | type)

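getoffset/gettype/offset_type pack a data offset and a 16-bit type into one integer, mirroring the 6-byte offset plus 2-byte flags layout of the on-disk entry. A worked example (dropping Python 2's long(), which only affects boxing):

    def offset_type(offset, type):
        return (offset << 16) | type

    q = offset_type(4096, 0)
    assert q == 4096 << 16
    assert q >> 16 == 4096      # getoffset(q), valid since no flag bits are set
    assert q & 0xFFFF == 0      # gettype(q)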
 def hash(text, p1, p2):
     """generate a hash from the given text and its parent hashes

     This hash combines both the current file contents and its history
     in a manner that makes it easy to distinguish nodes with the same
     content in the revision graph.
     """
     l = [p1, p2]
     l.sort()
     s = sha.new(l[0])
     s.update(l[1])
     s.update(text)
     return s.digest()

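The node hash is SHA-1 over the two parent nodes (sorted) followed by the text; sha.new is the pre-hashlib spelling. An equivalent sketch with hashlib, assuming 20-byte binary parent ids:

    import hashlib

    nullid = "\0" * 20

    def node_hash(text, p1=nullid, p2=nullid):
        # sorted parents first, then the revision text, as in hash() above
        a, b = sorted([p1, p2])
        s = hashlib.sha1(a)
        s.update(b)
        s.update(text)
        return s.digest()

    assert len(node_hash("hello\n")) == 20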
 def compress(text):
     """ generate a possibly-compressed representation of text """
     if not text:
         return ("", text)
     if len(text) < 44:
         if text[0] == '\0':
             return ("", text)
         return ('u', text)
     bin = zlib.compress(text)
     if len(bin) > len(text):
         if text[0] == '\0':
             return ("", text)
         return ('u', text)
     return ("", bin)

 def decompress(bin):
     """ decompress the given input """
     if not bin:
         return bin
     t = bin[0]
     if t == '\0':
         return bin
     if t == 'x':
         return zlib.decompress(bin)
     if t == 'u':
         return bin[1:]
     raise RevlogError(_("unknown compression type %r") % t)

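compress returns a (header, data) pair whose concatenation is what gets stored; decompress dispatches on the first byte: '\0' means raw, 'u' means uncompressed with a marker, and 'x' is a zlib stream (zlib output begins with 0x78, i.e. 'x'). A quick round-trip check, assuming compress/decompress as defined above are in scope:

    text = "x" * 200                  # long enough that zlib wins
    h, d = compress(text)
    assert h == "" and d[0] == "x"    # stored form is a zlib stream
    assert decompress(h + d) == text

    short = "abc"                     # too short to bother compressing
    h, d = compress(short)
    assert (h, d) == ("u", "abc")
    assert decompress(h + d) == short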
 class lazyparser(object):
     """
     this class avoids the need to parse the entirety of large indices
     """

     # lazyparser is not safe to use on windows if win32 extensions are not
     # available. it keeps the file handle open, which makes it impossible
     # to break hardlinks on local cloned repos.
     safe_to_use = os.name != 'nt' or (not util.is_win_9x() and
                                       hasattr(util, 'win32api'))

     def __init__(self, dataf, size):
         self.dataf = dataf
         self.s = struct.calcsize(indexformatng)
         self.datasize = size
         self.l = size/self.s
         self.index = [None] * self.l
         self.map = {nullid: nullrev}
         self.allmap = 0
         self.all = 0
         self.mapfind_count = 0

     def loadmap(self):
         """
         during a commit, we need to make sure the rev being added is
         not a duplicate. This requires loading the entire index,
         which is fairly slow. loadmap can load up just the node map,
         which takes much less time.
         """
         if self.allmap:
             return
         end = self.datasize
         self.allmap = 1
         cur = 0
         count = 0
         blocksize = self.s * 256
         self.dataf.seek(0)
         while cur < end:
             data = self.dataf.read(blocksize)
             off = 0
             for x in xrange(256):
                 n = data[off + ngshaoffset:off + ngshaoffset + 20]
                 self.map[n] = count
                 count += 1
                 if count >= self.l:
                     break
                 off += self.s
             cur += blocksize

     def loadblock(self, blockstart, blocksize, data=None):
         if self.all:
             return
         if data is None:
             self.dataf.seek(blockstart)
             if blockstart + blocksize > self.datasize:
                 # the revlog may have grown since we've started running,
                 # but we don't have space in self.index for more entries.
                 # limit blocksize so that we don't get too much data.
                 blocksize = max(self.datasize - blockstart, 0)
             data = self.dataf.read(blocksize)
         lend = len(data) / self.s
         i = blockstart / self.s
         off = 0
         # lazyindex supports __delitem__
         if lend > len(self.index) - i:
             lend = len(self.index) - i
         for x in xrange(lend):
             if self.index[i + x] == None:
                 b = data[off : off + self.s]
                 self.index[i + x] = b
                 n = b[ngshaoffset:ngshaoffset + 20]
                 self.map[n] = i + x
             off += self.s

     def findnode(self, node):
         """search backwards through the index file for a specific node"""
         if self.allmap:
             return None

         # hg log will cause many many searches for the manifest
         # nodes. After we get called a few times, just load the whole
         # thing.
         if self.mapfind_count > 8:
             self.loadmap()
             if node in self.map:
                 return node
             return None
         self.mapfind_count += 1
         last = self.l - 1
         while self.index[last] != None:
             if last == 0:
                 self.all = 1
                 self.allmap = 1
                 return None
             last -= 1
         end = (last + 1) * self.s
         blocksize = self.s * 256
         while end >= 0:
             start = max(end - blocksize, 0)
             self.dataf.seek(start)
             data = self.dataf.read(end - start)
             findend = end - start
             while True:
                 # we're searching backwards, so we have to make sure
                 # we don't find a changeset where this node is a parent
                 off = data.rfind(node, 0, findend)
                 findend = off
                 if off >= 0:
                     i = off / self.s
                     off = i * self.s
                     n = data[off + ngshaoffset:off + ngshaoffset + 20]
                     if n == node:
                         self.map[n] = i + start / self.s
                         return node
                 else:
                     break
             end -= blocksize
         return None

202
203 def loadindex(self, i=None, end=None):
203 def loadindex(self, i=None, end=None):
204 if self.all:
204 if self.all:
205 return
205 return
206 all = False
206 all = False
207 if i == None:
207 if i == None:
208 blockstart = 0
208 blockstart = 0
209 blocksize = (512 / self.s) * self.s
209 blocksize = (512 / self.s) * self.s
210 end = self.datasize
210 end = self.datasize
211 all = True
211 all = True
212 else:
212 else:
213 if end:
213 if end:
214 blockstart = i * self.s
214 blockstart = i * self.s
215 end = end * self.s
215 end = end * self.s
216 blocksize = end - blockstart
216 blocksize = end - blockstart
217 else:
217 else:
218 blockstart = (i & ~63) * self.s
218 blockstart = (i & ~63) * self.s
219 blocksize = self.s * 64
219 blocksize = self.s * 64
220 end = blockstart + blocksize
220 end = blockstart + blocksize
221 while blockstart < end:
221 while blockstart < end:
222 self.loadblock(blockstart, blocksize)
222 self.loadblock(blockstart, blocksize)
223 blockstart += blocksize
223 blockstart += blocksize
224 if all:
224 if all:
225 self.all = True
225 self.all = True
226
226
 class lazyindex(object):
     """a lazy version of the index array"""
     def __init__(self, parser):
         self.p = parser
     def __len__(self):
         return len(self.p.index)
     def load(self, pos):
         if pos < 0:
             pos += len(self.p.index)
         self.p.loadindex(pos)
         return self.p.index[pos]
     def __getitem__(self, pos):
         ret = self.p.index[pos] or self.load(pos)
         if isinstance(ret, str):
             ret = struct.unpack(indexformatng, ret)
         return ret
     def __setitem__(self, pos, item):
         self.p.index[pos] = item
     def __delitem__(self, pos):
         del self.p.index[pos]
     def insert(self, pos, e):
         self.p.index.insert(pos, e)
     def append(self, e):
         self.p.index.append(e)

 class lazymap(object):
     """a lazy version of the node map"""
     def __init__(self, parser):
         self.p = parser
     def load(self, key):
         n = self.p.findnode(key)
         if n == None:
             raise KeyError(key)
     def __contains__(self, key):
         if key in self.p.map:
             return True
         self.p.loadmap()
         return key in self.p.map
     def __iter__(self):
         yield nullid
         for i in xrange(self.p.l):
             ret = self.p.index[i]
             if not ret:
                 self.p.loadindex(i)
                 ret = self.p.index[i]
             if isinstance(ret, str):
                 ret = struct.unpack(indexformatng, ret)
             yield ret[7]
     def __getitem__(self, key):
         try:
             return self.p.map[key]
         except KeyError:
             try:
                 self.load(key)
                 return self.p.map[key]
             except KeyError:
                 raise KeyError("node " + hex(key))
     def __setitem__(self, key, val):
         self.p.map[key] = val
     def __delitem__(self, key):
         del self.p.map[key]

 indexformatv0 = ">4l20s20s20s"
 v0shaoffset = 56

 class revlogoldio(object):
     def __init__(self):
         self.size = struct.calcsize(indexformatv0)

     def parseindex(self, fp, inline):
         s = self.size
         index = []
         nodemap = {nullid: nullrev}
         n = off = 0
         data = fp.read()
         l = len(data)
         while off + s <= l:
             cur = data[off:off + s]
             off += s
             e = struct.unpack(indexformatv0, cur)
             # transform to revlogv1 format
             e2 = (offset_type(e[0], 0), e[1], -1, e[2], e[3],
                   nodemap[e[4]], nodemap[e[5]], e[6])
             index.append(e2)
             nodemap[e[6]] = n
             n += 1

         return index, nodemap, None

     def packentry(self, entry, node, version):
         e2 = (getoffset(entry[0]), entry[1], entry[3], entry[4],
               node(entry[5]), node(entry[6]), entry[7])
         return struct.pack(indexformatv0, *e2)

 # index ng:
 #  6 bytes: offset
 #  2 bytes: flags
 #  4 bytes: compressed length
 #  4 bytes: uncompressed length
 #  4 bytes: base rev
 #  4 bytes: link rev
 #  4 bytes: parent 1 rev
 #  4 bytes: parent 2 rev
 # 32 bytes: nodeid
 indexformatng = ">Qiiiiii20s12x"
 ngshaoffset = 32
 versionformat = ">I"

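The struct format strings pin down the on-disk entry sizes: a v0 entry is four 4-byte ints plus three 20-byte nodes, and a RevlogNG entry is the packed offset/flags quad-word, six 4-byte ints, a 20-byte node and 12 bytes of padding. A quick check:

    import struct

    indexformatv0 = ">4l20s20s20s"
    indexformatng = ">Qiiiiii20s12x"

    assert struct.calcsize(indexformatv0) == 76   # v0 entry
    assert struct.calcsize(indexformatng) == 64   # RevlogNG entry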
 class revlogio(object):
     def __init__(self):
         self.size = struct.calcsize(indexformatng)

     def parseindex(self, fp, inline):
         try:
             size = util.fstat(fp).st_size
         except AttributeError:
             size = 0

         if lazyparser.safe_to_use and not inline and size > 1000000:
             # big index, let's parse it on demand
             parser = lazyparser(fp, size)
             index = lazyindex(parser)
             nodemap = lazymap(parser)
             e = list(index[0])
             type = gettype(e[0])
             e[0] = offset_type(0, type)
             index[0] = e
             return index, nodemap, None

         s = self.size
         cache = None
         index = []
         nodemap = {nullid: nullrev}
         n = off = 0
         # if we're not using lazymap, always read the whole index
         data = fp.read()
         l = len(data)
         if inline:
             cache = (0, data)
         while off + s <= l:
             e = struct.unpack(indexformatng, data[off:off + s])
             index.append(e)
             nodemap[e[7]] = n
             n += 1
             off += s
             if inline:
                 if e[1] < 0:
                     break
                 off += e[1]

         e = list(index[0])
         type = gettype(e[0])
         e[0] = offset_type(0, type)
         index[0] = e

         return index, nodemap, cache

     def packentry(self, entry, node, version):
         p = struct.pack(indexformatng, *entry)
         if not entry[3] and not getoffset(entry[0]) and entry[5] == nullrev:
             p = struct.pack(versionformat, version) + p[4:]
         return p

 class revlog(object):
     """
     the underlying revision storage object

     A revlog consists of two parts, an index and the revision data.

     The index is a file with a fixed record size containing
     information on each revision, including its nodeid (hash), the
     nodeids of its parents, the position and offset of its data within
     the data file, and the revision it's based on. Finally, each entry
     contains a linkrev entry that can serve as a pointer to external
     data.

     The revision data itself is a linear collection of data chunks.
     Each chunk represents a revision and is usually represented as a
     delta against the previous chunk. To bound lookup time, runs of
     deltas are limited to about 2 times the length of the original
     version data. This makes retrieval of a version proportional to
     its size, or O(1) relative to the number of revisions.

     Both pieces of the revlog are written to in an append-only
     fashion, which means we never need to rewrite a file to insert or
     remove data, and can use some simple techniques to avoid the need
     for locking while reading.
     """
     def __init__(self, opener, indexfile):
         """
         create a revlog object

         opener is a function that abstracts the file opening operation
         and can be used to implement COW semantics or the like.
         """
         self.indexfile = indexfile
         self.datafile = indexfile[:-2] + ".d"
         self.opener = opener
         self._cache = None
         self._chunkcache = None
         self.nodemap = {nullid: nullrev}
         self.index = []

         v = REVLOG_DEFAULT_VERSION
         if hasattr(opener, "defversion"):
             v = opener.defversion
             if v & REVLOGNG:
                 v |= REVLOGNGINLINEDATA

         i = ""
         try:
             f = self.opener(self.indexfile)
             i = f.read(4)
             f.seek(0)
             if len(i) > 0:
                 v = struct.unpack(versionformat, i)[0]
         except IOError, inst:
             if inst.errno != errno.ENOENT:
                 raise

         self.version = v
         self._inline = v & REVLOGNGINLINEDATA
         flags = v & ~0xFFFF
         fmt = v & 0xFFFF
         if fmt == REVLOGV0 and flags:
             raise RevlogError(_("index %s unknown flags %#04x for format v0")
                               % (self.indexfile, flags >> 16))
         elif fmt == REVLOGNG and flags & ~REVLOGNGINLINEDATA:
             raise RevlogError(_("index %s unknown flags %#04x for revlogng")
                               % (self.indexfile, flags >> 16))
         elif fmt > REVLOGNG:
             raise RevlogError(_("index %s unknown format %d")
                               % (self.indexfile, fmt))

         self._io = revlogio()
         if self.version == REVLOGV0:
             self._io = revlogoldio()
         if i:
             d = self._io.parseindex(f, self._inline)
             self.index, self.nodemap, self._chunkcache = d

         # add the magic null revision at -1
         self.index.append((0, 0, 0, -1, -1, -1, -1, nullid))

     def _loadindex(self, start, end):
         """load a block of indexes all at once from the lazy parser"""
         if isinstance(self.index, lazyindex):
             self.index.p.loadindex(start, end)

     def _loadindexmap(self):
         """loads both the map and the index from the lazy parser"""
         if isinstance(self.index, lazyindex):
             p = self.index.p
             p.loadindex()
             self.nodemap = p.map

     def _loadmap(self):
         """loads the map from the lazy parser"""
         if isinstance(self.nodemap, lazymap):
             self.nodemap.p.loadmap()
             self.nodemap = self.nodemap.p.map

     def tip(self):
         return self.node(len(self.index) - 2)
     def count(self):
         return len(self.index) - 1

     def rev(self, node):
         try:
             return self.nodemap[node]
         except KeyError:
             raise LookupError(_('%s: no node %s') % (self.indexfile, hex(node)))
     def node(self, rev):
         return self.index[rev][7]
     def linkrev(self, node):
         return self.index[self.rev(node)][4]
     def parents(self, node):
         d = self.index[self.rev(node)][5:7]
         return (self.node(d[0]), self.node(d[1]))
     def parentrevs(self, rev):
         return self.index[rev][5:7]
     def start(self, rev):
         return getoffset(self.index[rev][0])
     def end(self, rev):
         return self.start(rev) + self.length(rev)
     def length(self, rev):
         return self.index[rev][1]
     def base(self, rev):
         return self.index[rev][3]

     def size(self, rev):
         """return the length of the uncompressed text for a given revision"""
         l = self.index[rev][2]
         if l >= 0:
             return l

         t = self.revision(self.node(rev))
         return len(t)

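These accessors double as documentation of the in-memory entry layout: each index entry is an 8-tuple. A sketch naming the positions (the field names are mine; the positions follow the accessors above):

    # positions per node()/linkrev()/parents()/start()/length()/base()/size()
    OFFSET_FLAGS, COMP_LEN, RAW_LEN, BASE, LINKREV, P1REV, P2REV, NODE = range(8)

    entry = (0, 0, 0, -1, -1, -1, -1, "\0" * 20)   # the magic null entry
    assert entry[NODE] == "\0" * 20
    assert entry[P1REV] == entry[P2REV] == -1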
     # alternate implementation: the advantage of this code is that it
     # will be faster for a single revision. But, the results are not
     # cached, so finding the size of every revision will be slower.
     """
     if self.cache and self.cache[1] == rev:
         return len(self.cache[2])

     base = self.base(rev)
     if self.cache and self.cache[1] >= base and self.cache[1] < rev:
         base = self.cache[1]
         text = self.cache[2]
     else:
         text = self.revision(self.node(base))

     l = len(text)
     for x in xrange(base + 1, rev + 1):
         l = mdiff.patchedsize(l, self.chunk(x))
     return l
     """

     def reachable(self, node, stop=None):
         """return a hash of all nodes ancestral to a given node, including
         the node itself, stopping when stop is matched"""
         reachable = {}
         visit = [node]
         reachable[node] = 1
         if stop:
             stopn = self.rev(stop)
         else:
             stopn = 0
         while visit:
             n = visit.pop(0)
             if n == stop:
                 continue
             if n == nullid:
                 continue
             for p in self.parents(n):
                 if self.rev(p) < stopn:
                     continue
                 if p not in reachable:
                     reachable[p] = 1
                     visit.append(p)
         return reachable

570 def nodesbetween(self, roots=None, heads=None):
570 def nodesbetween(self, roots=None, heads=None):
571 """Return a tuple containing three elements. Elements 1 and 2 contain
571 """Return a tuple containing three elements. Elements 1 and 2 contain
572 a final list bases and heads after all the unreachable ones have been
572 a final list bases and heads after all the unreachable ones have been
573 pruned. Element 0 contains a topologically sorted list of all
573 pruned. Element 0 contains a topologically sorted list of all
574
574
575 nodes that satisfy these constraints:
575 nodes that satisfy these constraints:
576 1. All nodes must be descended from a node in roots (the nodes on
576 1. All nodes must be descended from a node in roots (the nodes on
577 roots are considered descended from themselves).
577 roots are considered descended from themselves).
578 2. All nodes must also be ancestors of a node in heads (the nodes in
578 2. All nodes must also be ancestors of a node in heads (the nodes in
579 heads are considered to be their own ancestors).
579 heads are considered to be their own ancestors).
580
580
581 If roots is unspecified, nullid is assumed as the only root.
581 If roots is unspecified, nullid is assumed as the only root.
582 If heads is unspecified, it is taken to be the output of the
582 If heads is unspecified, it is taken to be the output of the
583 heads method (i.e. a list of all nodes in the repository that
583 heads method (i.e. a list of all nodes in the repository that
584 have no children)."""
584 have no children)."""
585 nonodes = ([], [], [])
585 nonodes = ([], [], [])
586 if roots is not None:
586 if roots is not None:
587 roots = list(roots)
587 roots = list(roots)
588 if not roots:
588 if not roots:
589 return nonodes
589 return nonodes
590 lowestrev = min([self.rev(n) for n in roots])
590 lowestrev = min([self.rev(n) for n in roots])
591 else:
591 else:
592 roots = [nullid] # Everybody's a descendent of nullid
592 roots = [nullid] # Everybody's a descendent of nullid
593 lowestrev = nullrev
593 lowestrev = nullrev
594 if (lowestrev == nullrev) and (heads is None):
594 if (lowestrev == nullrev) and (heads is None):
595 # We want _all_ the nodes!
595 # We want _all_ the nodes!
596 return ([self.node(r) for r in xrange(0, self.count())],
596 return ([self.node(r) for r in xrange(0, self.count())],
597 [nullid], list(self.heads()))
597 [nullid], list(self.heads()))
598 if heads is None:
598 if heads is None:
599 # All nodes are ancestors, so the latest ancestor is the last
599 # All nodes are ancestors, so the latest ancestor is the last
600 # node.
600 # node.
601 highestrev = self.count() - 1
601 highestrev = self.count() - 1
602 # Set ancestors to None to signal that every node is an ancestor.
602 # Set ancestors to None to signal that every node is an ancestor.
603 ancestors = None
603 ancestors = None
604 # Set heads to an empty dictionary for later discovery of heads
604 # Set heads to an empty dictionary for later discovery of heads
605 heads = {}
605 heads = {}
606 else:
606 else:
607 heads = list(heads)
607 heads = list(heads)
608 if not heads:
608 if not heads:
609 return nonodes
609 return nonodes
610 ancestors = {}
610 ancestors = {}
611 # Turn heads into a dictionary so we can remove 'fake' heads.
611 # Turn heads into a dictionary so we can remove 'fake' heads.
612 # Also, later we will be using it to filter out the heads we can't
612 # Also, later we will be using it to filter out the heads we can't
613 # find from roots.
613 # find from roots.
614 heads = dict.fromkeys(heads, 0)
614 heads = dict.fromkeys(heads, 0)
615 # Start at the top and keep marking parents until we're done.
615 # Start at the top and keep marking parents until we're done.
616 nodestotag = heads.keys()
616 nodestotag = heads.keys()
617 # Remember where the top was so we can use it as a limit later.
617 # Remember where the top was so we can use it as a limit later.
618 highestrev = max([self.rev(n) for n in nodestotag])
618 highestrev = max([self.rev(n) for n in nodestotag])
619 while nodestotag:
619 while nodestotag:
620 # grab a node to tag
620 # grab a node to tag
621 n = nodestotag.pop()
621 n = nodestotag.pop()
622 # Never tag nullid
622 # Never tag nullid
623 if n == nullid:
623 if n == nullid:
624 continue
624 continue
625 # A node's revision number represents its place in a
625 # A node's revision number represents its place in a
626 # topologically sorted list of nodes.
626 # topologically sorted list of nodes.
627 r = self.rev(n)
627 r = self.rev(n)
628 if r >= lowestrev:
628 if r >= lowestrev:
629 if n not in ancestors:
629 if n not in ancestors:
630 # If we are possibly a descendent of one of the roots
630 # If we are possibly a descendent of one of the roots
631 # and we haven't already been marked as an ancestor
631 # and we haven't already been marked as an ancestor
632 ancestors[n] = 1 # Mark as ancestor
632 ancestors[n] = 1 # Mark as ancestor
633 # Add non-nullid parents to list of nodes to tag.
633 # Add non-nullid parents to list of nodes to tag.
634 nodestotag.extend([p for p in self.parents(n) if
634 nodestotag.extend([p for p in self.parents(n) if
635 p != nullid])
635 p != nullid])
636 elif n in heads: # We've seen it before, is it a fake head?
636 elif n in heads: # We've seen it before, is it a fake head?
637 # So it is, real heads should not be the ancestors of
637 # So it is, real heads should not be the ancestors of
638 # any other heads.
638 # any other heads.
639 heads.pop(n)
            if not ancestors:
                return nonodes
            # Now that we have our set of ancestors, we want to remove any
            # roots that are not ancestors.

            # If one of the roots was nullid, everything is included anyway.
            if lowestrev > nullrev:
                # But, since we weren't, let's recompute the lowest rev to not
                # include roots that aren't ancestors.

                # Filter out roots that aren't ancestors of heads
                roots = [n for n in roots if n in ancestors]
                # Recompute the lowest revision
                if roots:
                    lowestrev = min([self.rev(n) for n in roots])
                else:
                    # No more roots?  Return empty list
                    return nonodes
            else:
                # We are descending from nullid, and don't need to care about
                # any other roots.
                lowestrev = nullrev
                roots = [nullid]
        # Transform our roots list into a 'set' (i.e. a dictionary where the
        # values don't matter).
        descendents = dict.fromkeys(roots, 1)
        # Also, keep the original roots so we can filter out roots that aren't
        # 'real' roots (i.e. are descended from other roots).
        roots = descendents.copy()
        # Our topologically sorted list of output nodes.
        orderedout = []
        # Don't start at nullid since we don't want nullid in our output list,
        # and if nullid shows up in descendents, empty parents will look like
        # they're descendents.
        for r in xrange(max(lowestrev, 0), highestrev + 1):
            n = self.node(r)
            isdescendent = False
            if lowestrev == nullrev:  # Everybody is a descendent of nullid
                isdescendent = True
            elif n in descendents:
                # n is already a descendent
                isdescendent = True
                # This check only needs to be done here because all the roots
                # will start being marked as descendents before the loop.
                if n in roots:
                    # If n was a root, check if it's a 'real' root.
                    p = tuple(self.parents(n))
                    # If any of its parents are descendents, it's not a root.
                    if (p[0] in descendents) or (p[1] in descendents):
                        roots.pop(n)
            else:
                p = tuple(self.parents(n))
                # A node is a descendent if either of its parents are
                # descendents.  (We seeded the descendents dict with the roots
                # up there, remember?)
                if (p[0] in descendents) or (p[1] in descendents):
                    descendents[n] = 1
                    isdescendent = True
            if isdescendent and ((ancestors is None) or (n in ancestors)):
                # Only include nodes that are both descendents and ancestors.
                orderedout.append(n)
                if (ancestors is not None) and (n in heads):
                    # We're trying to figure out which heads are reachable
                    # from roots.
                    # Mark this head as having been reached
                    heads[n] = 1
                elif ancestors is None:
                    # Otherwise, we're trying to discover the heads.
                    # Assume this is a head because if it isn't, the next step
                    # will eventually remove it.
                    heads[n] = 1
                    # But, obviously its parents aren't.
                    for p in self.parents(n):
                        heads.pop(p, None)
        heads = [n for n in heads.iterkeys() if heads[n] != 0]
        roots = roots.keys()
        assert orderedout
        assert roots
        assert heads
        return (orderedout, roots, heads)
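
A minimal standalone sketch of the marking pass above: visit revisions in
increasing order and flag a rev as a descendent as soon as either of its
parents is one. Toy parent table in place of revlog internals; all names
here are illustrative, not Mercurial's API.

nullrev = -1
# parentrevs[r] = (p1, p2); rev numbers only grow along parent links
parentrevs = {0: (nullrev, nullrev), 1: (0, nullrev),
              2: (1, nullrev), 3: (1, nullrev)}

def descendents_of(roots):
    isdesc = dict.fromkeys(roots, 1)
    for r in sorted(parentrevs):
        if r in isdesc:
            continue
        p1, p2 = parentrevs[r]
        # a rev is a descendent if either of its parents already is one
        if p1 in isdesc or p2 in isdesc:
            isdesc[r] = 1
    return sorted(isdesc)

print descendents_of([1])   # -> [1, 2, 3]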

    def heads(self, start=None, stop=None):
        """return the list of all nodes that have no children

        if start is specified, only heads that are descendants of
        start will be returned
        if stop is specified, it will consider all the revs from stop
        as if they had no children
        """
        if start is None:
            start = nullid
        if stop is None:
            stop = []
        stoprevs = dict.fromkeys([self.rev(n) for n in stop])
        startrev = self.rev(start)
        reachable = {startrev: 1}
        heads = {startrev: 1}

        parentrevs = self.parentrevs
        for r in xrange(startrev + 1, self.count()):
            for p in parentrevs(r):
                if p in reachable:
                    if r not in stoprevs:
                        reachable[r] = 1
                        heads[r] = 1
                    if p in heads and p not in stoprevs:
                        del heads[p]

        return [self.node(r) for r in heads]
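
The same forward scan drives heads(): every reachable rev enters as a
candidate head and is evicted as soon as one of its children appears. A
self-contained toy version of that single pass (stoprevs omitted):

def toy_heads(parentrevs, startrev):
    reachable = {startrev: 1}
    heads = {startrev: 1}
    for r in sorted(parentrevs):
        if r <= startrev:
            continue
        for p in parentrevs[r]:
            if p in reachable:
                reachable[r] = 1
                heads[r] = 1
                if p in heads:       # p has a child now, so it's no head
                    del heads[p]
    return sorted(heads)

print toy_heads({0: (-1, -1), 1: (0, -1), 2: (1, -1), 3: (1, -1)}, 0)
# -> [2, 3]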

    def children(self, node):
        """find the children of a given node"""
        c = []
        p = self.rev(node)
        for r in range(p + 1, self.count()):
            prevs = [pr for pr in self.parentrevs(r) if pr != nullrev]
            if prevs:
                for pr in prevs:
                    if pr == p:
                        c.append(self.node(r))
            elif p == nullrev:
                c.append(self.node(r))
        return c

    def _match(self, id):
        if isinstance(id, (long, int)):
            # rev
            return self.node(id)
        if len(id) == 20:
            # possibly a binary node
            # odds of a binary node being all hex in ASCII are 1 in 10**25
            try:
                node = id
                r = self.rev(node) # quick search the index
                return node
            except LookupError:
                pass # may be partial hex id
        try:
            # str(rev)
            rev = int(id)
            if str(rev) != id:
                raise ValueError
            if rev < 0:
                rev = self.count() + rev
            if rev < 0 or rev >= self.count():
                raise ValueError
            return self.node(rev)
        except (ValueError, OverflowError):
            pass
        if len(id) == 40:
            try:
                # a full hex nodeid?
                node = bin(id)
                r = self.rev(node)
                return node
            except TypeError:
                pass

    def _partialmatch(self, id):
        if len(id) < 40:
            try:
                # hex(node)[:...]
                bin_id = bin(id[:len(id) & ~1]) # grab an even number of digits
                node = None
                for n in self.nodemap:
                    if n.startswith(bin_id) and hex(n).startswith(id):
                        if node is not None:
                            raise LookupError(_("Ambiguous identifier"))
                        node = n
                if node is not None:
                    return node
            except TypeError:
                pass

    def lookup(self, id):
        """locate a node based on:
            - revision number or str(revision number)
            - nodeid or subset of hex nodeid
        """
        n = self._match(id)
        if n is not None:
            return n
        n = self._partialmatch(id)
        if n:
            return n

        raise LookupError(_("No match found"))
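
A sketch of the prefix trick _partialmatch() relies on: convert only an
even number of hex digits (so they map to whole bytes), then confirm the
full, possibly odd-length prefix against the hex form of each candidate.
binascii stands in here for Mercurial's bin()/hex() helpers.

from binascii import hexlify, unhexlify

def partialmatch(nodemap, id):
    bin_id = unhexlify(id[:len(id) & ~1])  # round down to even digits
    match = None
    for n in nodemap:
        if n.startswith(bin_id) and hexlify(n).startswith(id):
            if match is not None:
                raise KeyError("ambiguous identifier: " + id)
            match = n
    return match  # None when nothing matched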

    def cmp(self, node, text):
        """compare text with a given file revision"""
        p1, p2 = self.parents(node)
        return hash(text, p1, p2) != node

    def chunk(self, rev, df=None):
        start, length = self.start(rev), self.length(rev)
        if self._inline:
            start += (rev + 1) * self._io.size
        end = start + length
        def loadcache(df):
            cache_length = max(65536, length)
            if not df:
                if self._inline:
                    df = self.opener(self.indexfile)
                else:
                    df = self.opener(self.datafile)
            df.seek(start)
            self._chunkcache = (start, df.read(cache_length))

        if not self._chunkcache:
            loadcache(df)

        cache_start = self._chunkcache[0]
        cache_end = cache_start + len(self._chunkcache[1])
        if start >= cache_start and end <= cache_end:
            # it is cached
            offset = start - cache_start
        else:
            loadcache(df)
            offset = 0

        # avoid copying large chunks
        c = self._chunkcache[1]
        if len(c) > length:
            c = c[offset:offset + length]

        return decompress(c)
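
The caching policy in chunk() boils down to one contiguous read-ahead
window: serve a request from the window when it fits, otherwise reload a
window of at least 64k starting at the request. A generic sketch over any
seekable file object, not the revlog code itself:

class windowcache(object):
    def __init__(self, fp, minsize=65536):
        self.fp = fp
        self.minsize = minsize
        self.window = None          # (start, data)

    def read(self, start, length):
        if self.window:
            wstart, data = self.window
            if start >= wstart and start + length <= wstart + len(data):
                offset = start - wstart       # hit: slice out of the window
                return data[offset:offset + length]
        self.fp.seek(start)                   # miss: reload the window
        data = self.fp.read(max(self.minsize, length))
        self.window = (start, data)
        return data[:length]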

    def delta(self, node):
        """return or calculate a delta between a node and its predecessor"""
        r = self.rev(node)
        return self.revdiff(r - 1, r)

    def revdiff(self, rev1, rev2):
        """return or calculate a delta between two revisions"""
        b1 = self.base(rev1)
        b2 = self.base(rev2)
        if b1 == b2 and rev1 + 1 == rev2:
            return self.chunk(rev2)
        else:
            return mdiff.textdiff(self.revision(self.node(rev1)),
                                  self.revision(self.node(rev2)))

    def revision(self, node):
        """return an uncompressed revision of a given node"""
        if node == nullid:
            return ""
        if self._cache and self._cache[0] == node:
            return self._cache[2]

        # look up what we need to read
        text = None
        rev = self.rev(node)
        base = self.base(rev)

        if self._inline:
            # we probably have the whole chunk cached
            df = None
        else:
            df = self.opener(self.datafile)

        # do we have useful data cached?
        if self._cache and self._cache[1] >= base and self._cache[1] < rev:
            base = self._cache[1]
            text = self._cache[2]
            self._loadindex(base, rev + 1)
        else:
            self._loadindex(base, rev + 1)
            text = self.chunk(base, df=df)

        bins = [self.chunk(r, df) for r in xrange(base + 1, rev + 1)]
        text = mdiff.patches(text, bins)
        p1, p2 = self.parents(node)
        if node != hash(text, p1, p2):
            raise RevlogError(_("integrity check failed on %s:%d")
                              % (self.datafile, rev))

        self._cache = (node, rev, text)
        return text
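
Reconstruction in revision() is a fold over the delta chain: one full
snapshot at base(rev), then every stored delta up to rev applied in order.
Schematically, with chunk and patchall as stand-ins for self.chunk() and
mdiff.patches():

def reconstruct(base, rev, chunk, patchall):
    text = chunk(base)                                   # full snapshot
    bins = [chunk(r) for r in xrange(base + 1, rev + 1)] # deltas in order
    return patchall(text, bins)                          # fold them in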

    def checkinlinesize(self, tr, fp=None):
        if not self._inline:
            return
        if not fp:
            fp = self.opener(self.indexfile, 'r')
            fp.seek(0, 2)
        size = fp.tell()
        if size < 131072:
            return
        trinfo = tr.find(self.indexfile)
        if trinfo is None:
            raise RevlogError(_("%s not found in the transaction")
                              % self.indexfile)

        trindex = trinfo[2]
        dataoff = self.start(trindex)

        tr.add(self.datafile, dataoff)
        df = self.opener(self.datafile, 'w')
        calc = self._io.size
        for r in xrange(self.count()):
            start = self.start(r) + (r + 1) * calc
            length = self.length(r)
            fp.seek(start)
            d = fp.read(length)
            df.write(d)
        fp.close()
        df.close()
        fp = self.opener(self.indexfile, 'w', atomictemp=True)
        self.version &= ~(REVLOGNGINLINEDATA)
        self._inline = False
        for i in xrange(self.count()):
            e = self._io.packentry(self.index[i], self.node, self.version)
            fp.write(e)

        # if we don't call rename, the temp file will never replace the
        # real index
        fp.rename()

        tr.replace(self.indexfile, trindex * calc)
        self._chunkcache = None

    def addrevision(self, text, transaction, link, p1, p2, d=None):
        """add a revision to the log

        text - the revision data to add
        transaction - the transaction object used for rollback
        link - the linkrev data to add
        p1, p2 - the parent nodeids of the revision
        d - an optional precomputed delta
        """
        dfh = None
        if not self._inline:
            dfh = self.opener(self.datafile, "a")
        ifh = self.opener(self.indexfile, "a+")
        return self._addrevision(text, transaction, link, p1, p2, d, ifh, dfh)

    def _addrevision(self, text, transaction, link, p1, p2, d, ifh, dfh):
        node = hash(text, p1, p2)
        if node in self.nodemap:
            return node

        curr = self.count()
        prev = curr - 1
        base = self.base(prev)
        offset = self.end(prev)

        if curr:
            if not d:
                ptext = self.revision(self.node(prev))
                d = mdiff.textdiff(ptext, text)
            data = compress(d)
            l = len(data[1]) + len(data[0])
            dist = l + offset - self.start(base)

        # full versions are inserted when the needed deltas
        # become comparable to the uncompressed text
        if not curr or dist > len(text) * 2:
            data = compress(text)
            l = len(data[1]) + len(data[0])
            base = curr

        e = (offset_type(offset, 0), l, len(text),
             base, link, self.rev(p1), self.rev(p2), node)
        self.index.insert(-1, e)
        self.nodemap[node] = curr

        entry = self._io.packentry(e, self.node, self.version)
        if not self._inline:
            transaction.add(self.datafile, offset)
            transaction.add(self.indexfile, curr * len(entry))
            if data[0]:
                dfh.write(data[0])
            dfh.write(data[1])
            dfh.flush()
            ifh.write(entry)
        else:
            ifh.seek(0, 2)
            transaction.add(self.indexfile, ifh.tell(), prev)
            ifh.write(entry)
            ifh.write(data[0])
            ifh.write(data[1])
            self.checkinlinesize(transaction, ifh)

        self._cache = (node, curr, text)
        return node
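
The storage decision in _addrevision() reduces to a size test: keep a
delta while the compressed chain from the base snapshot stays under twice
the new text, otherwise store a fresh full version. A sketch of just that
arithmetic, with hypothetical names:

def choose_storage(chainbytes, deltabytes, textlen, first):
    # chainbytes: compressed bytes from the base snapshot through prev rev
    dist = chainbytes + deltabytes
    if first or dist > textlen * 2:
        return "full"     # start a new delta chain here
    return "delta"        # extend the existing chain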

    def ancestor(self, a, b):
        """calculate the least common ancestor of nodes a and b"""

        def parents(rev):
            return [p for p in self.parentrevs(rev) if p != nullrev]

        c = ancestor.ancestor(self.rev(a), self.rev(b), parents)
        if c is None:
            return nullid

        return self.node(c)
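
A toy stand-in for the ancestor.ancestor() call above: collect the
ancestor sets of both revs and take the highest-numbered rev they share.
(The real algorithm weighs depth rather than rev numbers, but the shape
is the same.) parents maps each rev to its non-null parent revs:

def toy_ancestor(a, b, parents):
    def ancestors(r):
        seen, stack = {r: 1}, [r]
        while stack:
            for p in parents(stack.pop()):
                if p not in seen:
                    seen[p] = 1
                    stack.append(p)
        return seen
    ancs = ancestors(a)
    common = [r for r in ancestors(b) if r in ancs]
    return max(common) if common else None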

    def group(self, nodelist, lookup, infocollect=None):
        """calculate a delta group

        Given a list of changeset revs, return a set of deltas and
        metadata corresponding to nodes.  The first delta is
        parent(nodes[0]) -> nodes[0]; the receiver is guaranteed to
        have this parent, as it has all history before these
        changesets.  The parent is parent[0].
        """
        revs = [self.rev(n) for n in nodelist]

        # if we don't have any revisions touched by these changesets, bail
        if not revs:
            yield changegroup.closechunk()
            return

        # add the parent of the first rev
        p = self.parents(self.node(revs[0]))[0]
        revs.insert(0, self.rev(p))

        # build deltas
        for d in xrange(0, len(revs) - 1):
            a, b = revs[d], revs[d + 1]
            nb = self.node(b)

            if infocollect is not None:
                infocollect(nb)

            d = self.revdiff(a, b)
            p = self.parents(nb)
            meta = nb + p[0] + p[1] + lookup(nb)
            yield changegroup.genchunk("%s%s" % (meta, d))

        yield changegroup.closechunk()
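
The wire form group() produces is a sequence of length-prefixed chunks:
80 bytes of node/p1/p2/cs metadata followed by the delta payload, with a
zero-length chunk closing the stream. A framing sketch along the lines of
changegroup.genchunk()/closechunk() (byte layout assumed, not quoted):

import struct

def genchunk(data):
    # the 4-byte big-endian length counts itself as well as the payload
    return struct.pack(">l", len(data) + 4) + data

def closechunk():
    return struct.pack(">l", 0)   # terminator: a zero-length chunk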

    def addgroup(self, revs, linkmapper, transaction, unique=0):
        """
        add a delta group

        given a set of deltas, add them to the revision log. the
        first delta is against its parent, which should be in our
        log; the rest are against the previous delta.
        """

        # track the base of the current delta log
        r = self.count()
        t = r - 1
        node = None

        base = prev = nullrev
        start = end = textlen = 0
        if r:
            end = self.end(t)

        ifh = self.opener(self.indexfile, "a+")
        ifh.seek(0, 2)
        transaction.add(self.indexfile, ifh.tell(), self.count())
        if self._inline:
            dfh = None
        else:
            transaction.add(self.datafile, end)
            dfh = self.opener(self.datafile, "a")

        # loop through our set of deltas
        chain = None
        for chunk in revs:
            node, p1, p2, cs = struct.unpack("20s20s20s20s", chunk[:80])
            link = linkmapper(cs)
            if node in self.nodemap:
                # this can happen if two branches make the same change
                # if unique:
                #    raise RevlogError(_("already have %s") % hex(node[:4]))
                chain = node
                continue
            delta = chunk[80:]

            for p in (p1, p2):
                if not p in self.nodemap:
                    raise LookupError(_("unknown parent %s") % short(p))

            if not chain:
                # retrieve the parent revision of the delta chain
                chain = p1
                if not chain in self.nodemap:
                    raise LookupError(_("unknown base %s") % short(chain[:4]))

            # full versions are inserted when the needed deltas become
            # comparable to the uncompressed text or when the previous
            # version is not the one we have a delta against. We use
            # the size of the previous full rev as a proxy for the
            # current size.

            if chain == prev:
                tempd = compress(delta)
                cdelta = tempd[0] + tempd[1]
                textlen = mdiff.patchedsize(textlen, delta)

            if chain != prev or (end - start + len(cdelta)) > textlen * 2:
                # flush our writes here so we can read it in revision
                if dfh:
                    dfh.flush()
                ifh.flush()
                text = self.revision(chain)
                text = mdiff.patches(text, [delta])
                chk = self._addrevision(text, transaction, link, p1, p2, None,
                                        ifh, dfh)
                if not dfh and not self._inline:
                    # addrevision switched from inline to conventional
                    # reopen the index
                    dfh = self.opener(self.datafile, "a")
                    ifh = self.opener(self.indexfile, "a")
                if chk != node:
                    raise RevlogError(_("consistency error adding group"))
                textlen = len(text)
            else:
                e = (offset_type(end, 0), len(cdelta), textlen, base,
                     link, self.rev(p1), self.rev(p2), node)
                self.index.insert(-1, e)
                self.nodemap[node] = r
                entry = self._io.packentry(e, self.node, self.version)
                if self._inline:
                    ifh.write(entry)
                    ifh.write(cdelta)
                    self.checkinlinesize(transaction, ifh)
                    if not self._inline:
                        dfh = self.opener(self.datafile, "a")
                        ifh = self.opener(self.indexfile, "a")
                else:
                    dfh.write(cdelta)
                    ifh.write(entry)

            t, r, chain, prev = r, r + 1, node, node
            base = self.base(t)
            start = self.start(base)
            end = self.end(t)

        return node

    def strip(self, rev, minlink):
        if self.count() == 0 or rev >= self.count():
            return

        if isinstance(self.index, lazyindex):
            self._loadindexmap()

        # When stripping away a revision, we need to make sure it
        # does not actually belong to an older changeset.
        # The minlink parameter defines the oldest revision
        # we're allowed to strip away.
        while minlink > self.index[rev][4]:
            rev += 1
            if rev >= self.count():
                return

        # first truncate the files on disk
        end = self.start(rev)
        if not self._inline:
            df = self.opener(self.datafile, "a")
            df.truncate(end)
            end = rev * self._io.size
        else:
            end += rev * self._io.size

        indexf = self.opener(self.indexfile, "a")
        indexf.truncate(end)

        # then reset internal state in memory to forget those revisions
        self._cache = None
        self._chunkcache = None
        for x in xrange(rev, self.count()):
            del self.nodemap[self.node(x)]

        del self.index[rev:-1]
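
The truncation points in strip() differ only in where index and data
live. A sketch of that offset arithmetic, assuming datastart is
start(rev) for the first stripped rev and entrysize the fixed index
entry size (names hypothetical):

def truncate_points(datastart, rev, entrysize, inline):
    if inline:
        # one .i file holds index entries and data interleaved
        return {"index": datastart + rev * entrysize}
    # split revlog: cut the .d file and the .i file separately
    return {"data": datastart, "index": rev * entrysize}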

    def checksize(self):
        expected = 0
        if self.count():
            expected = self.end(self.count() - 1)

        try:
            f = self.opener(self.datafile)
            f.seek(0, 2)
            actual = f.tell()
            dd = actual - expected
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            dd = 0

        try:
            f = self.opener(self.indexfile)
            f.seek(0, 2)
            actual = f.tell()
            s = self._io.size
            i = actual / s
            di = actual - (i * s)
            if self._inline:
                databytes = 0
                for r in xrange(self.count()):
                    databytes += self.length(r)
                dd = 0
                di = actual - self.count() * s - databytes
        except IOError, inst:
            if inst.errno != errno.ENOENT:
                raise
            di = 0

        return (dd, di)
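
What checksize() reports, in plain terms: dd is data-file bytes beyond the
last indexed chunk, di is index-file bytes that don't round to whole
entries (for inline revlogs, data drift is folded into di instead). A
sketch of the non-inline case only:

def drift(datasize, indexsize, expected_data, entrysize):
    dd = datasize - expected_data                         # data surplus
    di = indexsize - (indexsize / entrysize) * entrysize  # partial entry
    return dd, di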