upstream/mercurial-mirror Commit - r24405:cbe9d50d

1

# manifest.py - manifest revision class for mercurial

1

# manifest.py - manifest revision class for mercurial

2

#

2

#

3

4

#

4

#

5

# This software may be used and distributed according to the terms of the

5

# This software may be used and distributed according to the terms of the

6

# GNU General Public License version 2 or any later version.

6

# GNU General Public License version 2 or any later version.

7

8

from i18n import _

8

from i18n import _

9

import mdiff, parsers, error, revlog, util, scmutil

9

import mdiff, parsers, error, revlog, util, scmutil

10

import array, struct

10

import array, struct

11

12

# Module-level alias so the decorator can be written as ``@propertycache``.
propertycache = util.propertycache

13

14

class _lazymanifest(dict):

14

class _lazymanifest(dict):

15

"""This is the pure implementation of lazymanifest.

15

"""This is the pure implementation of lazymanifest.

16

17

It has not been optimized *at all* and is not lazy.

17

It has not been optimized *at all* and is not lazy.

18

"""

18

"""

19

20

def __init__(self, data):

20

def __init__(self, data):

21

# This init method does a little bit of excessive-looking

21

# This init method does a little bit of excessive-looking

22

# precondition checking. This is so that the behavior of this

22

# precondition checking. This is so that the behavior of this

23

# class exactly matches its C counterpart to try and help

23

# class exactly matches its C counterpart to try and help

24

# prevent surprise breakage for anyone that develops against

24

# prevent surprise breakage for anyone that develops against

25

# the pure version.

25

# the pure version.

26

if data and data[-1] != '\n':

26

if data and data[-1] != '\n':

27

raise ValueError('Manifest did not end in a newline.')

27

raise ValueError('Manifest did not end in a newline.')

28

dict.__init__(self)

28

dict.__init__(self)

29

prev = None

29

prev = None

30

for l in data.splitlines():

30

for l in data.splitlines():

31

if prev is not None and prev > l:

31

if prev is not None and prev > l:

32

raise ValueError('Manifest lines not in sorted order.')

32

raise ValueError('Manifest lines not in sorted order.')

33

prev = l

33

prev = l

34

f, n = l.split('\0')

34

f, n = l.split('\0')

35

if len(n) > 40:

35

if len(n) > 40:

36

self[f] = revlog.bin(n[:40]), n[40:]

36

self[f] = revlog.bin(n[:40]), n[40:]

37

else:

37

else:

38

self[f] = revlog.bin(n), ''

38

self[f] = revlog.bin(n), ''

39

40

def __setitem__(self, k, v):

40

def __setitem__(self, k, v):

41

node, flag = v

41

node, flag = v

42

assert node is not None

42

assert node is not None

43

if len(node) > 21:

43

if len(node) > 21:

44

node = node[:21] # match c implementation behavior

44

node = node[:21] # match c implementation behavior

45

dict.__setitem__(self, k, (node, flag))

45

dict.__setitem__(self, k, (node, flag))

46

47

def __iter__(self):

47

def __iter__(self):

48

return iter(sorted(dict.keys(self)))

48

return iter(sorted(dict.keys(self)))

49

50

def iterkeys(self):

50

def iterkeys(self):

51

return iter(sorted(dict.keys(self)))

51

return iter(sorted(dict.keys(self)))

52

53

def iterentries(self):

53

def iterentries(self):

54

return ((f, e[0], e[1]) for f, e in sorted(self.iteritems()))

54

return ((f, e[0], e[1]) for f, e in sorted(self.iteritems()))

55

56

def copy(self):

56

def copy(self):

57

c = _lazymanifest('')

57

c = _lazymanifest('')

58

c.update(self)

58

c.update(self)

59

return c

59

return c

60

61

def diff(self, m2, clean=False):

61

def diff(self, m2, clean=False):

62

'''Finds changes between the current manifest and m2.'''

62

'''Finds changes between the current manifest and m2.'''

63

diff = {}

63

diff = {}

64

65

for fn, e1 in self.iteritems():

65

for fn, e1 in self.iteritems():

66

if fn not in m2:

66

if fn not in m2:

67

diff[fn] = e1, (None, '')

67

diff[fn] = e1, (None, '')

68

else:

68

else:

69

e2 = m2[fn]

69

e2 = m2[fn]

70

if e1 != e2:

70

if e1 != e2:

71

diff[fn] = e1, e2

71

diff[fn] = e1, e2

72

elif clean:

72

elif clean:

73

diff[fn] = None

73

diff[fn] = None

74

75

for fn, e2 in m2.iteritems():

75

for fn, e2 in m2.iteritems():

76

if fn not in self:

76

if fn not in self:

77

diff[fn] = (None, ''), e2

77

diff[fn] = (None, ''), e2

78

79

return diff

79

return diff

80

81

def filtercopy(self, filterfn):

81

def filtercopy(self, filterfn):

82

c = _lazymanifest('')

82

c = _lazymanifest('')

83

for f, n, fl in self.iterentries():

83

for f, n, fl in self.iterentries():

84

if filterfn(f):

84

if filterfn(f):

85

c[f] = n, fl

85

c[f] = n, fl

86

return c

86

return c

87

88

def text(self):

88

def text(self):

89

"""Get the full data of this manifest as a bytestring."""

89

"""Get the full data of this manifest as a bytestring."""

90

fl = sorted(self.iterentries())

90

fl = sorted(self.iterentries())

91

92

_hex = revlog.hex

92

_hex = revlog.hex

93

# if this is changed to support newlines in filenames,

93

# if this is changed to support newlines in filenames,

94

# be sure to check the templates/ dir again (especially *-raw.tmpl)

94

# be sure to check the templates/ dir again (especially *-raw.tmpl)

95

return ''.join("%s\0%s%s\n" % (

95

return ''.join("%s\0%s%s\n" % (

96

f, _hex(n[:20]), flag) for f, n, flag in fl)

96

f, _hex(n[:20]), flag) for f, n, flag in fl)

97

98

# Use the lazymanifest from the parsers module when it provides one;
# otherwise keep the pure Python class defined above.
try:
    _lazymanifest = parsers.lazymanifest
except AttributeError:
    pass

102

103

class manifestdict(object):
    """Mapping of filename to node, backed by a _lazymanifest.

    The backing object lives in ``self._lm`` and stores (node, flag)
    pairs; item access on this class exposes only the node.
    """

    def __init__(self, data=''):
        self._lm = _lazymanifest(data)

    def __getitem__(self, key):
        return self._lm[key][0]

    def find(self, key):
        """Return the (node, flag) pair stored for key."""
        return self._lm[key]

    def __len__(self):
        return len(self._lm)

    def __setitem__(self, key, node):
        # keep whatever flag the file already has (or '' for a new file)
        self._lm[key] = node, self.flags(key, '')

    def __contains__(self, key):
        return key in self._lm

    def __delitem__(self, key):
        del self._lm[key]

    def __iter__(self):
        return self._lm.__iter__()

    def iterkeys(self):
        return self._lm.iterkeys()

    def keys(self):
        return list(self.iterkeys())

    def intersectfiles(self, files):
        '''make a new lazymanifest with the intersection of self with files

        The algorithm assumes that files is much smaller than self.'''
        ret = manifestdict()
        lm = self._lm
        for fn in files:
            if fn in lm:
                ret._lm[fn] = self._lm[fn]
        return ret

    def filesnotin(self, m2):
        '''Set of files in this manifest that are not in the other'''
        files = set(self)
        files.difference_update(m2)
        return files

    @propertycache
    def _dirs(self):
        return scmutil.dirs(self)

    def dirs(self):
        return self._dirs

    def hasdir(self, dir):
        return dir in self._dirs

    def matches(self, match):
        '''generate a new manifest filtered by the match argument'''
        if match.always():
            return self.copy()

        files = match.files()
        # with few explicitly named files, look each one up directly
        # instead of running the matcher over every entry
        if (len(files) < 100 and (match.matchfn == match.exact or
            (not match.anypats() and util.all(fn in self for fn in files)))):
            return self.intersectfiles(files)

        lm = manifestdict('')
        lm._lm = self._lm.filtercopy(match)
        return lm

    def diff(self, m2, clean=False):
        '''Finds changes between the current manifest and m2.

        Args:
          m2: the manifest to which this manifest should be compared.
          clean: if true, include files unchanged between these manifests
                 with a None value in the returned dictionary.

        The result is returned as a dict with filename as key and
        values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
        nodeid in the current/other manifest and fl1/fl2 is the flag
        in the current/other manifest. Where the file does not exist,
        the nodeid will be None and the flags will be the empty
        string.
        '''
        return self._lm.diff(m2._lm, clean)

    def setflag(self, key, flag):
        """Replace the flag of key, keeping its node."""
        self._lm[key] = self[key], flag

    def get(self, key, default=None):
        """Return the node for key, or default if key is absent."""
        try:
            return self._lm[key][0]
        except KeyError:
            return default

    def flags(self, key, default=''):
        """Return the flag for key, or default if key is absent."""
        try:
            return self._lm[key][1]
        except KeyError:
            return default

    def copy(self):
        c = manifestdict('')
        c._lm = self._lm.copy()
        return c

    def iteritems(self):
        """Yield (filename, node) pairs."""
        return (x[:2] for x in self._lm.iterentries())

    def text(self):
        return self._lm.text()

    def fastdelta(self, base, changes):
        """Given a base manifest text as an array.array and a list of changes
        relative to that text, compute a delta that can be used by revlog.

        changes is iterated as (filename, todelete) pairs. Returns
        (arraytext, deltatext). Raises AssertionError when a file marked
        for deletion is not present in base.
        """
        delta = []
        dstart = None
        dend = None
        dline = [""]
        start = 0
        # zero copy representation of base as a buffer
        addbuf = util.buffer(base)

        # start with a readonly loop that finds the offset of
        # each line and creates the deltas
        for f, todelete in changes:
            # start will either be the offset of the item's line or the
            # insert point; the search resumes from the previous start
            start, end = _msearch(addbuf, f, start)
            if not todelete:
                h, fl = self._lm[f]
                l = "%s\0%s%s\n" % (f, revlog.hex(h), fl)
            else:
                if start == end:
                    # item we want to delete was not found, error out
                    raise AssertionError(
                            _("failed to remove %s from manifest") % f)
                l = ""
            if dstart is not None and dstart <= start and dend >= start:
                # this change begins inside (or right at the end of) the
                # pending chunk, so fold it into that chunk
                if dend < end:
                    dend = end
                if l:
                    dline.append(l)
            else:
                # flush the pending chunk and start a new one
                if dstart is not None:
                    delta.append([dstart, dend, "".join(dline)])
                dstart = start
                dend = end
                dline = [l]

        if dstart is not None:
            delta.append([dstart, dend, "".join(dline)])
        # apply the delta to the base, and get a delta for addrevision
        deltatext, arraytext = _addlistdelta(base, delta)
        return arraytext, deltatext

261

262

def _msearch(m, s, lo=0, hi=None):

262

def _msearch(m, s, lo=0, hi=None):

263

'''return a tuple (start, end) that says where to find s within m.

263

'''return a tuple (start, end) that says where to find s within m.

264

265

If the string is found m[start:end] are the line containing

265

If the string is found m[start:end] are the line containing

266

that string. If start == end the string was not found and

266

that string. If start == end the string was not found and

267

they indicate the proper sorted insertion point.

267

they indicate the proper sorted insertion point.

268

269

m should be a buffer or a string

269

m should be a buffer or a string

270

s is a string'''

270

s is a string'''

271

def advance(i, c):

271

def advance(i, c):

272

while i < lenm and m[i] != c:

272

while i < lenm and m[i] != c:

273

i += 1

273

i += 1

274

return i

274

return i

275

if not s:

275

if not s:

276

return (lo, lo)

276

return (lo, lo)

277

lenm = len(m)

277

lenm = len(m)

278

if not hi:

278

if not hi:

279

hi = lenm

279

hi = lenm

280

while lo < hi:

280

while lo < hi:

281

mid = (lo + hi) // 2

281

mid = (lo + hi) // 2

282

start = mid

282

start = mid

283

while start > 0 and m[start - 1] != '\n':

283

while start > 0 and m[start - 1] != '\n':

284

start -= 1

284

start -= 1

285

end = advance(start, '\0')

285

end = advance(start, '\0')

286

if m[start:end] < s:

286

if m[start:end] < s:

287

# we know that after the null there are 40 bytes of sha1

287

# we know that after the null there are 40 bytes of sha1

288

# this translates to the bisect lo = mid + 1

288

# this translates to the bisect lo = mid + 1

289

lo = advance(end + 40, '\n') + 1

289

lo = advance(end + 40, '\n') + 1

290

else:

290

else:

291

# this translates to the bisect hi = mid

291

# this translates to the bisect hi = mid

292

hi = start

292

hi = start

293

end = advance(lo, '\0')

293

end = advance(lo, '\0')

294

found = m[lo:end]

294

found = m[lo:end]

295

if s == found:

295

if s == found:

296

# we know that after the null there are 40 bytes of sha1

296

# we know that after the null there are 40 bytes of sha1

297

end = advance(end + 40, '\n')

297

end = advance(end + 40, '\n')

298

return (lo, end + 1)

298

return (lo, end + 1)

299

else:

299

else:

300

return (lo, lo)

300

return (lo, lo)

301

302

def _checkforbidden(l):

302

def _checkforbidden(l):

303

"""Check filenames for illegal characters."""

303

"""Check filenames for illegal characters."""

304

for f in l:

304

for f in l:

305

if '\n' in f or '\r' in f:

305

if '\n' in f or '\r' in f:

306

raise error.RevlogError(

306

raise error.RevlogError(

307

_("'\\n' and '\\r' disallowed in filenames: %r") % f)

307

_("'\\n' and '\\r' disallowed in filenames: %r") % f)

308

309

310

# apply the changes collected during the bisect loop to our addlist
# return a delta suitable for addrevision
def _addlistdelta(addlist, x):
    """Apply the (start, end, content) replacements in x to addlist.

    Returns (deltatext, newaddlist): deltatext is each replacement
    packed as three big-endian longs (start, end, len(content))
    followed by content, all joined together; newaddlist is a new
    array with the replacements applied. addlist itself is not modified.
    """
    # for large addlist arrays, building a new array is cheaper
    # than repeatedly modifying the existing one
    currentposition = 0
    newaddlist = array.array('c')

    for start, end, content in x:
        # copy the untouched span before this replacement
        newaddlist += addlist[currentposition:start]
        if content:
            newaddlist += array.array('c', content)

        # skip over the span being replaced
        currentposition = end

    newaddlist += addlist[currentposition:]

    deltatext = "".join(struct.pack(">lll", start, end, len(content))
                   + content for start, end, content in x)
    return deltatext, newaddlist

330

331

def _splittopdir(f):

331

def _splittopdir(f):

332

if '/' in f:

332

if '/' in f:

333

dir, subpath = f.split('/', 1)

333

dir, subpath = f.split('/', 1)

334

return dir + '/', subpath

334

return dir + '/', subpath

335

else:

335

else:

336

return '', f

336

return '', f

337

338

class treemanifest(object):
    """Manifest stored as a tree of per-directory treemanifest objects.

    _dir is the full path prefix of this node ('' for the root),
    _dirs maps a top-level directory name (with trailing '/') to its
    child treemanifest, _files maps a filename in this directory to
    its node, and _flags maps a filename in this directory to its flags.
    """

    def __init__(self, dir='', text=''):
        self._dir = dir
        self._dirs = {}
        # Using _lazymanifest here is a little slower than plain old dicts
        self._files = {}
        self._flags = {}
        lm = _lazymanifest(text)
        for f, n, fl in lm.iterentries():
            self[f] = n
            if fl:
                self.setflag(f, fl)

    def _subpath(self, path):
        """Return path prefixed with this node's directory."""
        return self._dir + path

    def __len__(self):
        size = len(self._files)
        for m in self._dirs.values():
            size += m.__len__()
        return size

    def __str__(self):
        return '<treemanifest dir=%s>' % self._dir

    def iteritems(self):
        """Yield (full path, node) pairs for every file in this subtree."""
        for p, n in sorted(self._dirs.items() + self._files.items()):
            if p in self._files:
                yield self._subpath(p), n
            else:
                # n is a child treemanifest; it yields full paths itself
                for f, sn in n.iteritems():
                    yield f, sn

    def iterkeys(self):
        """Yield the full path of every file in this subtree."""
        for p in sorted(self._dirs.keys() + self._files.keys()):
            if p in self._files:
                yield self._subpath(p)
            else:
                for f in self._dirs[p].iterkeys():
                    yield f

    def keys(self):
        return list(self.iterkeys())

    def __iter__(self):
        return self.iterkeys()

    def __contains__(self, f):
        if f is None:
            return False
        dir, subpath = _splittopdir(f)
        if dir:
            if dir not in self._dirs:
                return False
            return self._dirs[dir].__contains__(subpath)
        else:
            return f in self._files

    def get(self, f, default=None):
        """Return the node for path f, or default if f is absent."""
        dir, subpath = _splittopdir(f)
        if dir:
            if dir not in self._dirs:
                return default
            return self._dirs[dir].get(subpath, default)
        else:
            return self._files.get(f, default)

    def __getitem__(self, f):
        dir, subpath = _splittopdir(f)
        if dir:
            return self._dirs[dir].__getitem__(subpath)
        else:
            return self._files[f]

    def flags(self, f):
        """Return the flags for path f, or '' if none are recorded."""
        dir, subpath = _splittopdir(f)
        if dir:
            if dir not in self._dirs:
                return ''
            return self._dirs[dir].flags(subpath)
        else:
            if f in self._dirs:
                return ''
            return self._flags.get(f, '')

    def find(self, f):
        """Return the (node, flags) pair for path f."""
        dir, subpath = _splittopdir(f)
        if dir:
            return self._dirs[dir].find(subpath)
        else:
            return self._files[f], self._flags.get(f, '')

    def __delitem__(self, f):
        dir, subpath = _splittopdir(f)
        if dir:
            self._dirs[dir].__delitem__(subpath)
            # If the directory is now empty, remove it
            if not self._dirs[dir]._dirs and not self._dirs[dir]._files:
                del self._dirs[dir]
        else:
            del self._files[f]
            if f in self._flags:
                del self._flags[f]

    def __setitem__(self, f, n):
        assert n is not None
        dir, subpath = _splittopdir(f)
        if dir:
            # create the child tree on first use
            if dir not in self._dirs:
                self._dirs[dir] = treemanifest(self._subpath(dir))
            self._dirs[dir].__setitem__(subpath, n)
        else:
            self._files[f] = n

    def setflag(self, f, flags):
        """Set the flags (symlink, executable) for path f."""
        dir, subpath = _splittopdir(f)
        if dir:
            if dir not in self._dirs:
                self._dirs[dir] = treemanifest(self._subpath(dir))
            self._dirs[dir].setflag(subpath, flags)
        else:
            self._flags[f] = flags

    def copy(self):
        copy = treemanifest(self._dir)
        for d in self._dirs:
            copy._dirs[d] = self._dirs[d].copy()
        copy._files = dict.copy(self._files)
        copy._flags = dict.copy(self._flags)
        return copy

    def intersectfiles(self, files):
        '''make a new treemanifest with the intersection of self with files

        The algorithm assumes that files is much smaller than self.'''
        ret = treemanifest()
        for fn in files:
            if fn in self:
                ret[fn] = self[fn]
                flags = self.flags(fn)
                if flags:
                    ret.setflag(fn, flags)
        return ret

    def filesnotin(self, m2):
        '''Set of files in this manifest that are not in the other'''
        files = set()
        def _filesnotin(t1, t2):
            # walk both trees together; a directory missing from t2
            # contributes every file below it
            for d, m1 in t1._dirs.iteritems():
                if d in t2._dirs:
                    m2 = t2._dirs[d]
                    _filesnotin(m1, m2)
                else:
                    files.update(m1.iterkeys())

            for fn in t1._files.iterkeys():
                if fn not in t2._files:
                    files.add(t1._subpath(fn))

        _filesnotin(self, m2)
        return files

    @propertycache
    def _alldirs(self):
        return scmutil.dirs(self)

    def dirs(self):
        return self._alldirs

    def hasdir(self, dir):
        return dir in self._alldirs

    def matches(self, match):
        '''generate a new manifest filtered by the match argument'''
        if match.always():
            return self.copy()

        files = match.files()
        if (match.matchfn == match.exact or
            (not match.anypats() and util.all(fn in self for fn in files))):
            return self.intersectfiles(files)

        m = self.copy()
        # keys() returns a list, so deleting while looping is safe
        for fn in m.keys():
            if not match(fn):
                del m[fn]
        return m

    def diff(self, m2, clean=False):
        '''Finds changes between the current manifest and m2.

        Args:
          m2: the manifest to which this manifest should be compared.
          clean: if true, include files unchanged between these manifests
                 with a None value in the returned dictionary.

        The result is returned as a dict with filename as key and
        values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
        nodeid in the current/other manifest and fl1/fl2 is the flag
        in the current/other manifest. Where the file does not exist,
        the nodeid will be None and the flags will be the empty
        string.
        '''
        result = {}
        emptytree = treemanifest()
        def _diff(t1, t2):
            # directories present in t1 (compared against an empty tree
            # when t2 lacks them)
            for d, m1 in t1._dirs.iteritems():
                m2 = t2._dirs.get(d, emptytree)
                _diff(m1, m2)

            # directories that exist only in t2
            for d, m2 in t2._dirs.iteritems():
                if d not in t1._dirs:
                    _diff(emptytree, m2)

            for fn, n1 in t1._files.iteritems():
                fl1 = t1._flags.get(fn, '')
                n2 = t2._files.get(fn, None)
                fl2 = t2._flags.get(fn, '')
                if n1 != n2 or fl1 != fl2:
                    result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
                elif clean:
                    result[t1._subpath(fn)] = None

            for fn, n2 in t2._files.iteritems():
                if fn not in t1._files:
                    fl2 = t2._flags.get(fn, '')
                    result[t2._subpath(fn)] = ((None, ''), (n2, fl2))

        _diff(self, m2)
        return result

    def text(self):
        """Get the full data of this manifest as a bytestring."""
        fl = self.keys()
        _checkforbidden(fl)

        hex, flags = revlog.hex, self.flags
        # if this is changed to support newlines in filenames,
        # be sure to check the templates/ dir again (especially *-raw.tmpl)
        return ''.join("%s\0%s%s\n" % (f, hex(self[f]), flags(f)) for f in fl)

567

579

568

class manifest(revlog.revlog):

580

class manifest(revlog.revlog):

569

def __init__(self, opener):

581

def __init__(self, opener):

570

# During normal operations, we expect to deal with not more than four

582

# During normal operations, we expect to deal with not more than four

571

# revs at a time (such as during commit --amend). When rebasing large

583

# revs at a time (such as during commit --amend). When rebasing large

572

# stacks of commits, the number can go up, hence the config knob below.

584

# stacks of commits, the number can go up, hence the config knob below.

573

cachesize = 4

585

cachesize = 4

574

usetreemanifest = False

586

usetreemanifest = False

575

opts = getattr(opener, 'options', None)

587

opts = getattr(opener, 'options', None)

576

if opts is not None:

588

if opts is not None:

577

cachesize = opts.get('manifestcachesize', cachesize)

589

cachesize = opts.get('manifestcachesize', cachesize)

578

usetreemanifest = opts.get('usetreemanifest', usetreemanifest)

590

usetreemanifest = opts.get('usetreemanifest', usetreemanifest)

579

self._mancache = util.lrucachedict(cachesize)

591

self._mancache = util.lrucachedict(cachesize)

580

revlog.revlog.__init__(self, opener, "00manifest.i")

592

revlog.revlog.__init__(self, opener, "00manifest.i")

581

self._usetreemanifest = usetreemanifest

593

self._usetreemanifest = usetreemanifest

582

594

583

def _newmanifest(self, data=''):

595

def _newmanifest(self, data=''):

584

if self._usetreemanifest:

596

if self._usetreemanifest:

585

return treemanifest('', data)

597

return treemanifest('', data)

586

return manifestdict(data)

598

return manifestdict(data)

587

599

588

def readdelta(self, node):

600

def readdelta(self, node):

589

r = self.rev(node)

601

r = self.rev(node)

590

d = mdiff.patchtext(self.revdiff(self.deltaparent(r), r))

602

d = mdiff.patchtext(self.revdiff(self.deltaparent(r), r))

591

return self._newmanifest(d)

603

return self._newmanifest(d)

592

604

593

def readfast(self, node):

605

def readfast(self, node):

594

'''use the faster of readdelta or read'''

606

'''use the faster of readdelta or read'''

595

r = self.rev(node)

607

r = self.rev(node)

596

deltaparent = self.deltaparent(r)

608

deltaparent = self.deltaparent(r)

597

if deltaparent != revlog.nullrev and deltaparent in self.parentrevs(r):

609

if deltaparent != revlog.nullrev and deltaparent in self.parentrevs(r):

598

return self.readdelta(node)

610

return self.readdelta(node)

599

return self.read(node)

611

return self.read(node)

600

612

601

def read(self, node):

613

def read(self, node):

602

if node == revlog.nullid:

614

if node == revlog.nullid:

603

return self._newmanifest() # don't upset local cache

615

return self._newmanifest() # don't upset local cache

604

if node in self._mancache:

616

if node in self._mancache:

605

return self._mancache[node][0]

617

return self._mancache[node][0]

606

text = self.revision(node)

618

text = self.revision(node)

607

arraytext = array.array('c', text)

619

arraytext = array.array('c', text)

608

m = self._newmanifest(text)

620

m = self._newmanifest(text)

609

self._mancache[node] = (m, arraytext)

621

self._mancache[node] = (m, arraytext)

610

return m

622

return m

611

623

612

def find(self, node, f):

624

def find(self, node, f):

613

'''look up entry for a single file efficiently.

625

'''look up entry for a single file efficiently.

614

return (node, flags) pair if found, (None, None) if not.'''

626

return (node, flags) pair if found, (None, None) if not.'''

615

m = self.read(node)

627

m = self.read(node)

616

try:

628

try:

617

return m.find(f)

629

return m.find(f)

618

except KeyError:

630

except KeyError:

619

return None, None

631

return None, None

620

632

621

def add(self, m, transaction, link, p1, p2, added, removed):

633

def add(self, m, transaction, link, p1, p2, added, removed):

622

if p1 in self._mancache and not self._usetreemanifest:

634

if p1 in self._mancache and not self._usetreemanifest:

623

# If our first parent is in the manifest cache, we can

635

# If our first parent is in the manifest cache, we can

624

# compute a delta here using properties we know about the

636

# compute a delta here using properties we know about the

625

# manifest up-front, which may save time later for the

637

# manifest up-front, which may save time later for the

626

# revlog layer.

638

# revlog layer.

627

639

628

_checkforbidden(added)

640

_checkforbidden(added)

629

# combine the changed lists into one list for sorting

641

# combine the changed lists into one list for sorting

630

work = [(x, False) for x in added]

642

work = [(x, False) for x in added]

631

work.extend((x, True) for x in removed)

643

work.extend((x, True) for x in removed)

632

# this could use heapq.merge() (from Python 2.6+) or equivalent

644

# this could use heapq.merge() (from Python 2.6+) or equivalent

633

# since the lists are already sorted

645

# since the lists are already sorted

634

work.sort()

646

work.sort()

635

647

636

arraytext, deltatext = m.fastdelta(self._mancache[p1][1], work)

648

arraytext, deltatext = m.fastdelta(self._mancache[p1][1], work)

637

cachedelta = self.rev(p1), deltatext

649

cachedelta = self.rev(p1), deltatext

638

text = util.buffer(arraytext)

650

text = util.buffer(arraytext)

639

else:

651

else:

640

# The first parent manifest isn't already loaded, so we'll

652

# The first parent manifest isn't already loaded, so we'll

641

# just encode a fulltext of the manifest and pass that

653

# just encode a fulltext of the manifest and pass that

642

# through to the revlog layer, and let it handle the delta

654

# through to the revlog layer, and let it handle the delta

643

# process.

655

# process.

644

text = m.text()

656

text = m.text()

645

arraytext = array.array('c', text)

657

arraytext = array.array('c', text)

646

cachedelta = None

658

cachedelta = None

647

659

648

n = self.addrevision(text, transaction, link, p1, p2, cachedelta)

660

n = self.addrevision(text, transaction, link, p1, p2, cachedelta)

649

self._mancache[n] = (m, arraytext)

661

self._mancache[n] = (m, arraytext)

650

662

651

return n

663

return n

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             # manifest.py - manifest revision class for mercurial
             #
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from i18n import _
             import mdiff, parsers, error, revlog, util, scmutil
             import array, struct
             propertycache = util.propertycache
             class _lazymanifest(dict):
                 """This is the pure implementation of lazymanifest.
                 It has not been optimized *at all* and is not lazy.
                 """
                 def __init__(self, data):
                     # This init method does a little bit of excessive-looking
                     # precondition checking. This is so that the behavior of this
                     # class exactly matches its C counterpart to try and help
                     # prevent surprise breakage for anyone that develops against
                     # the pure version.
                     if data and data[-1] != '\n':
                         raise ValueError('Manifest did not end in a newline.')
                     dict.__init__(self)
                     prev = None
                     for l in data.splitlines():
                         if prev is not None and prev > l:
                             raise ValueError('Manifest lines not in sorted order.')
                         prev = l
                         f, n = l.split('\0')
                         if len(n) > 40:
                             self[f] = revlog.bin(n[:40]), n[40:]
                         else:
                             self[f] = revlog.bin(n), ''
                 def __setitem__(self, k, v):
                     node, flag = v
                     assert node is not None
                     if len(node) > 21:
                         node = node[:21] # match c implementation behavior
                     dict.__setitem__(self, k, (node, flag))
                 def __iter__(self):
                     return iter(sorted(dict.keys(self)))
                 def iterkeys(self):
                     return iter(sorted(dict.keys(self)))
                 def iterentries(self):
                     return ((f, e[0], e[1]) for f, e in sorted(self.iteritems()))
                 def copy(self):
                     c = _lazymanifest('')
                     c.update(self)
                     return c
                 def diff(self, m2, clean=False):
                     '''Finds changes between the current manifest and m2.'''
                     diff = {}
                     for fn, e1 in self.iteritems():
                         if fn not in m2:
                             diff[fn] = e1, (None, '')
                         else:
                             e2 = m2[fn]
                             if e1 != e2:
                                 diff[fn] = e1, e2
                             elif clean:
                                 diff[fn] = None
                     for fn, e2 in m2.iteritems():
                         if fn not in self:
                             diff[fn] = (None, ''), e2
                     return diff
                 def filtercopy(self, filterfn):
                     c = _lazymanifest('')
                     for f, n, fl in self.iterentries():
                         if filterfn(f):
                             c[f] = n, fl
                     return c
                 def text(self):
                     """Get the full data of this manifest as a bytestring."""
                     fl = sorted(self.iterentries())
                     _hex = revlog.hex
                     # if this is changed to support newlines in filenames,
                     # be sure to check the templates/ dir again (especially *-raw.tmpl)
                     return ''.join("%s\0%s%s\n" % (
                         f, _hex(n[:20]), flag) for f, n, flag in fl)
             # Rebind _lazymanifest to parsers.lazymanifest when the parsers module
             # provides one (presumably the C counterpart referred to in the class
             # comments -- confirm); otherwise keep the pure-Python class.
             _lazymanifest = getattr(parsers, 'lazymanifest', _lazymanifest)
             class manifestdict(object):
                 """Dict-like manifest backed by a _lazymanifest kept in self._lm.

                 Item access exposes only the node of each entry; flags are read
                 and written through flags() and setflag().
                 """

                 def __init__(self, data=''):
                     self._lm = _lazymanifest(data)

                 def __getitem__(self, key):
                     entry = self._lm[key]
                     return entry[0]

                 def find(self, key):
                     """Return the stored entry for key; raises KeyError if absent."""
                     return self._lm[key]

                 def __len__(self):
                     return len(self._lm)

                 def __setitem__(self, key, node):
                     # Keep whatever flag the file already carries ('' if new).
                     flag = self.flags(key, '')
                     self._lm[key] = (node, flag)

                 def __contains__(self, key):
                     return key in self._lm

                 def __delitem__(self, key):
                     del self._lm[key]

                 def __iter__(self):
                     return iter(self._lm)

                 def iterkeys(self):
                     return self._lm.iterkeys()

                 def keys(self):
                     return list(self.iterkeys())

                 def intersectfiles(self, files):
                     '''make a new lazymanifest with the intersection of self with files

                     The algorithm assumes that files is much smaller than self.'''
                     subset = manifestdict()
                     source, target = self._lm, subset._lm
                     for fn in files:
                         if fn in source:
                             target[fn] = source[fn]
                     return subset

                 def filesnotin(self, m2):
                     '''Set of files in this manifest that are not in the other'''
                     return set(self).difference(m2)

                 @propertycache
                 def _dirs(self):
                     return scmutil.dirs(self)

                 def dirs(self):
                     return self._dirs

                 def hasdir(self, dir):
                     return dir in self._dirs

                 def matches(self, match):
                     '''generate a new manifest filtered by the match argument'''
                     if match.always():
                         return self.copy()

                     files = match.files()
                     if len(files) < 100:
                         # Short file lists that are exact, or pattern-free and
                         # fully present, are handled by direct lookups.
                         direct = match.matchfn == match.exact
                         if not direct:
                             direct = (not match.anypats() and
                                       util.all(fn in self for fn in files))
                         if direct:
                             return self.intersectfiles(files)

                     filtered = manifestdict('')
                     filtered._lm = self._lm.filtercopy(match)
                     return filtered

                 def diff(self, m2, clean=False):
                     '''Finds changes between the current manifest and m2.

                     Args:
                       m2: the manifest to which this manifest should be compared.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.

                     The result is returned as a dict with filename as key and
                     values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                     nodeid in the current/other manifest and fl1/fl2 is the flag
                     in the current/other manifest. Where the file does not exist,
                     the nodeid will be None and the flags will be the empty
                     string.
                     '''
                     return self._lm.diff(m2._lm, clean)

                 def setflag(self, key, flag):
                     """Replace the flag of key, keeping its current node."""
                     node = self[key]
                     self._lm[key] = (node, flag)

                 def get(self, key, default=None):
                     """Return the node for key, or default when key is absent."""
                     try:
                         entry = self._lm[key]
                     except KeyError:
                         return default
                     return entry[0]

                 def flags(self, key, default=''):
                     """Return the flag for key, or default when key is absent."""
                     try:
                         entry = self._lm[key]
                     except KeyError:
                         return default
                     return entry[1]

                 def copy(self):
                     dup = manifestdict('')
                     dup._lm = self._lm.copy()
                     return dup

                 def iteritems(self):
                     """Iterate over the first two fields of each underlying entry."""
                     entries = self._lm.iterentries()
                     return (entry[:2] for entry in entries)

                 def text(self):
                     return self._lm.text()

                 def fastdelta(self, base, changes):
                     """Given a base manifest text as an array.array and a list of changes
                     relative to that text, compute a delta that can be used by revlog.

                     Each change is a (filename, todelete) pair. Returns a tuple
                     (arraytext, deltatext) as produced by _addlistdelta.
                     """
                     hunks = []
                     hstart = None
                     hend = None
                     hlines = [""]
                     pos = 0
                     # zero copy representation of base as a buffer
                     basebuf = util.buffer(base)

                     # read-only pass: locate each changed line in the base text
                     # and collect the replacement hunks
                     for fname, todelete in changes:
                         # pos is either the offset of the existing line or the
                         # insertion point for a new one
                         pos, stop = _msearch(basebuf, fname, pos)
                         if todelete:
                             if pos == stop:
                                 # item we want to delete was not found, error out
                                 raise AssertionError(
                                         _("failed to remove %s from manifest") % fname)
                             newline = ""
                         else:
                             node, flag = self._lm[fname]
                             newline = "%s\0%s%s\n" % (fname, revlog.hex(node), flag)

                         if hstart is None or hstart > pos or hend < pos:
                             # Not touching the hunk being built: flush it (if
                             # any) and open a new one at this position.
                             if hstart is not None:
                                 hunks.append([hstart, hend, "".join(hlines)])
                             hstart = pos
                             hend = stop
                             hlines = [newline]
                         else:
                             # Extend the hunk being built.
                             if hend < stop:
                                 hend = stop
                             if newline:
                                 hlines.append(newline)

                     if hstart is not None:
                         hunks.append([hstart, hend, "".join(hlines)])
                     # apply the delta to the base, and get a delta for addrevision
                     deltatext, arraytext = _addlistdelta(base, hunks)
                     return arraytext, deltatext
             def _msearch(m, s, lo=0, hi=None):
                 '''return a tuple (start, end) that says where to find s within m.
                 If the string is found m[start:end] are the line containing
                 that string.  If start == end the string was not found and
                 they indicate the proper sorted insertion point.
                 m should be a buffer or a string
                 s is a string'''
                 def advance(i, c):
                     while i < lenm and m[i] != c:
                         i += 1
                     return i
                 if not s:
                     return (lo, lo)
                 lenm = len(m)
                 if not hi:
                     hi = lenm
                 while lo < hi:
                     mid = (lo + hi) // 2
                     start = mid
                     while start > 0 and m[start - 1] != '\n':
                         start -= 1
                     end = advance(start, '\0')
                     if m[start:end] < s:
                         # we know that after the null there are 40 bytes of sha1
                         # this translates to the bisect lo = mid + 1
                         lo = advance(end + 40, '\n') + 1
                     else:
                         # this translates to the bisect hi = mid
                         hi = start
                 end = advance(lo, '\0')
                 found = m[lo:end]
                 if s == found:
                     # we know that after the null there are 40 bytes of sha1
                     end = advance(end + 40, '\n')
                     return (lo, end + 1)
                 else:
                     return (lo, lo)
             def _checkforbidden(l):
                 """Check filenames for illegal characters."""
                 for f in l:
                     if '\n' in f or '\r' in f:
                         raise error.RevlogError(
                             _("'\\n' and '\\r' disallowed in filenames: %r") % f)
             # apply the changes collected during the bisect loop to our addlist
             # return a delta suitable for addrevision
             def _addlistdelta(addlist, x):
                 """Apply the (start, end, content) hunks in x to addlist.

                 Returns (deltatext, newaddlist): deltatext is each hunk packed as
                 three big-endian longs (start, end, content length) followed by
                 its content; newaddlist is a new array with the hunks applied.
                 """
                 # for large addlist arrays, building a new array is cheaper
                 # than repeatedly modifying the existing one
                 rebuilt = array.array('c')
                 cursor = 0
                 for start, end, content in x:
                     # copy the untouched span, then the replacement (if any)
                     rebuilt += addlist[cursor:start]
                     if content:
                         rebuilt += array.array('c', content)
                     cursor = end
                 rebuilt += addlist[cursor:]

                 packed = [struct.pack(">lll", start, end, len(content)) + content
                           for start, end, content in x]
                 return "".join(packed), rebuilt
             def _splittopdir(f):
                 if '/' in f:
                     dir, subpath = f.split('/', 1)
                     return dir + '/', subpath
                 else:
                     return '', f
             class treemanifest(object):
                 """Manifest stored as a tree with one treemanifest per directory.

                 Every node holds:
                   _dir:   path prefix of this node ('' for the root)
                   _dirs:  subdirectory name (with trailing '/') -> treemanifest
                   _files: file name within this directory -> nodeid
                   _flags: file name within this directory -> flag string
                 """

                 def __init__(self, dir='', text=''):
                     """Create the node for directory dir, filled from manifest text."""
                     self._dir = dir
                     self._dirs = {}
                     # Using _lazymanifest here is a little slower than plain old dicts
                     self._files = {}
                     self._flags = {}
                     lm = _lazymanifest(text)
                     for f, n, fl in lm.iterentries():
                         self[f] = n
                         if fl:
                             self.setflag(f, fl)

                 def _subpath(self, path):
                     """Return path prefixed with this node's directory."""
                     return self._dir + path

                 def __len__(self):
                     """Count the files in this node and in every subdirectory."""
                     size = len(self._files)
                     for m in self._dirs.values():
                         size += m.__len__()
                     return size

                 def __str__(self):
                     return '<treemanifest dir=%s>' % self._dir

                 def iteritems(self):
                     """Yield (full path, nodeid) pairs, recursing into subdirectories.

                     The entries of each directory are visited in sorted name order.
                     """
                     for p, n in sorted(self._dirs.items() + self._files.items()):
                         if p in self._files:
                             yield self._subpath(p), n
                         else:
                             # n is the subdirectory's treemanifest
                             for f, sn in n.iteritems():
                                 yield f, sn

                 def iterkeys(self):
                     """Yield full paths, recursing into subdirectories.

                     The entries of each directory are visited in sorted name order.
                     """
                     for p in sorted(self._dirs.keys() + self._files.keys()):
                         if p in self._files:
                             yield self._subpath(p)
                         else:
                             for f in self._dirs[p].iterkeys():
                                 yield f

                 def keys(self):
                     return list(self.iterkeys())

                 def __iter__(self):
                     return self.iterkeys()

                 def __contains__(self, f):
                     """Tell whether file f (a path relative to this node) exists."""
                     if f is None:
                         return False
                     dir, subpath = _splittopdir(f)
                     if dir:
                         if dir not in self._dirs:
                             return False
                         return self._dirs[dir].__contains__(subpath)
                     else:
                         return f in self._files

                 def get(self, f, default=None):
                     """Return the nodeid of f, or default when f is absent."""
                     dir, subpath = _splittopdir(f)
                     if dir:
                         if dir not in self._dirs:
                             return default
                         return self._dirs[dir].get(subpath, default)
                     else:
                         return self._files.get(f, default)

                 def __getitem__(self, f):
                     """Return the nodeid of f; raises KeyError when f is absent."""
                     dir, subpath = _splittopdir(f)
                     if dir:
                         return self._dirs[dir].__getitem__(subpath)
                     else:
                         return self._files[f]

                 def flags(self, f):
                     """Return the flag string of f, or '' when none is recorded."""
                     dir, subpath = _splittopdir(f)
                     if dir:
                         if dir not in self._dirs:
                             return ''
                         return self._dirs[dir].flags(subpath)
                     else:
                         # a name that is a key of _dirs never has flags
                         if f in self._dirs:
                             return ''
                         return self._flags.get(f, '')

                 def find(self, f):
                     """Return (nodeid, flags) for f; raises KeyError when absent."""
                     dir, subpath = _splittopdir(f)
                     if dir:
                         return self._dirs[dir].find(subpath)
                     else:
                         return self._files[f], self._flags.get(f, '')

                 def __delitem__(self, f):
                     """Remove f, along with its flag and any directory left empty."""
                     dir, subpath = _splittopdir(f)
                     if dir:
                         self._dirs[dir].__delitem__(subpath)
                         # If the directory is now empty, remove it
                         if not self._dirs[dir]._dirs and not self._dirs[dir]._files:
                             del self._dirs[dir]
                     else:
                         del self._files[f]
                         if f in self._flags:
                             del self._flags[f]

                 def __setitem__(self, f, n):
                     """Set the nodeid of f to n, creating subdirectory nodes as needed."""
                     assert n is not None
                     dir, subpath = _splittopdir(f)
                     if dir:
                         if dir not in self._dirs:
                             self._dirs[dir] = treemanifest(self._subpath(dir))
                         self._dirs[dir].__setitem__(subpath, n)
                     else:
                         self._files[f] = n

                 def setflag(self, f, flags):
                     """Set the flags (symlink, executable) for path f."""
                     dir, subpath = _splittopdir(f)
                     if dir:
                         if dir not in self._dirs:
                             self._dirs[dir] = treemanifest(self._subpath(dir))
                         self._dirs[dir].setflag(subpath, flags)
                     else:
                         self._flags[f] = flags

                 def copy(self):
                     """Return a copy whose subdirectory nodes are copied recursively."""
                     copy = treemanifest(self._dir)
                     for d in self._dirs:
                         copy._dirs[d] = self._dirs[d].copy()
                     copy._files = dict.copy(self._files)
                     copy._flags = dict.copy(self._flags)
                     return copy

                 def intersectfiles(self, files):
                     '''make a new treemanifest with the intersection of self with files

                     The algorithm assumes that files is much smaller than self.'''
                     ret = treemanifest()
                     for fn in files:
                         if fn in self:
                             ret[fn] = self[fn]
                             flags = self.flags(fn)
                             if flags:
                                 ret.setflag(fn, flags)
                     return ret

                 def filesnotin(self, m2):
                     '''Set of files in this manifest that are not in the other'''
                     files = set()

                     def _filesnotin(t1, t2):
                         # Walk both trees together; a directory that t2 lacks
                         # contributes every file below it.
                         for d, m1 in t1._dirs.iteritems():
                             if d in t2._dirs:
                                 sub2 = t2._dirs[d]
                                 _filesnotin(m1, sub2)
                             else:
                                 files.update(m1.iterkeys())

                         for fn in t1._files.iterkeys():
                             if fn not in t2._files:
                                 files.add(t1._subpath(fn))

                     _filesnotin(self, m2)
                     return files

                 @propertycache
                 def _alldirs(self):
                     return scmutil.dirs(self)

                 def dirs(self):
                     return self._alldirs

                 def hasdir(self, dir):
                     return dir in self._alldirs

                 def matches(self, match):
                     '''generate a new manifest filtered by the match argument'''
                     if match.always():
                         return self.copy()
                     files = match.files()
                     if (match.matchfn == match.exact or
                         (not match.anypats() and util.all(fn in self for fn in files))):
                         return self.intersectfiles(files)
                     m = self.copy()
                     # keys() returns a list, so deleting while looping is safe
                     for fn in m.keys():
                         if not match(fn):
                             del m[fn]
                     return m

                 def diff(self, m2, clean=False):
                     '''Finds changes between the current manifest and m2.

                     Args:
                       m2: the manifest to which this manifest should be compared.
                       clean: if true, include files unchanged between these manifests
                              with a None value in the returned dictionary.

                     The result is returned as a dict with filename as key and
                     values of the form ((n1,fl1),(n2,fl2)), where n1/n2 is the
                     nodeid in the current/other manifest and fl1/fl2 is the flag
                     in the current/other manifest. Where the file does not exist,
                     the nodeid will be None and the flags will be the empty
                     string.
                     '''
                     result = {}
                     # stands in for a directory that exists on one side only
                     emptytree = treemanifest()

                     def _diff(t1, t2):
                         for d, m1 in t1._dirs.iteritems():
                             m2 = t2._dirs.get(d, emptytree)
                             _diff(m1, m2)
                         for d, m2 in t2._dirs.iteritems():
                             if d not in t1._dirs:
                                 _diff(emptytree, m2)
                         for fn, n1 in t1._files.iteritems():
                             fl1 = t1._flags.get(fn, '')
                             n2 = t2._files.get(fn, None)
                             fl2 = t2._flags.get(fn, '')
                             if n1 != n2 or fl1 != fl2:
                                 result[t1._subpath(fn)] = ((n1, fl1), (n2, fl2))
                             elif clean:
                                 result[t1._subpath(fn)] = None
                         for fn, n2 in t2._files.iteritems():
                             if fn not in t1._files:
                                 fl2 = t2._flags.get(fn, '')
                                 result[t2._subpath(fn)] = ((None, ''), (n2, fl2))

                     _diff(self, m2)
                     return result

                 def text(self):
                     """Get the full data of this manifest as a bytestring."""
                     fl = self.keys()
                     _checkforbidden(fl)
                     hex, flags = revlog.hex, self.flags
                     # if this is changed to support newlines in filenames,
                     # be sure to check the templates/ dir again (especially *-raw.tmpl)
                     return ''.join("%s\0%s%s\n" % (f, hex(self[f]), flags(f)) for f in fl)
             class manifest(revlog.revlog):
                 def __init__(self, opener):
                     """Open the "00manifest.i" revlog through opener.

                     The optional opener.options mapping may override the cache
                     size ('manifestcachesize') and switch on tree manifests
                     ('usetreemanifest').
                     """
                     opts = getattr(opener, 'options', None)
                     if opts is None:
                         opts = {}
                     # During normal operations, we expect to deal with not more than four
                     # revs at a time (such as during commit --amend). When rebasing large
                     # stacks of commits, the number can go up, hence the config knob below.
                     cachesize = opts.get('manifestcachesize', 4)
                     usetreemanifest = opts.get('usetreemanifest', False)
                     self._mancache = util.lrucachedict(cachesize)
                     revlog.revlog.__init__(self, opener, "00manifest.i")
                     self._usetreemanifest = usetreemanifest
                 def _newmanifest(self, data=''):
                     if self._usetreemanifest:
                         return treemanifest('', data)
                     return manifestdict(data)
                 def readdelta(self, node):
                     r = self.rev(node)
                     d = mdiff.patchtext(self.revdiff(self.deltaparent(r), r))
                     return self._newmanifest(d)
                 def readfast(self, node):
                     '''use the faster of readdelta or read'''
                     r = self.rev(node)
                     deltaparent = self.deltaparent(r)
                     if deltaparent != revlog.nullrev and deltaparent in self.parentrevs(r):
                         return self.readdelta(node)
                     return self.read(node)
                 def read(self, node):
                     if node == revlog.nullid:
                         return self._newmanifest() # don't upset local cache
                     if node in self._mancache:
                         return self._mancache[node][0]
                     text = self.revision(node)
                     arraytext = array.array('c', text)
                     m = self._newmanifest(text)
                     self._mancache[node] = (m, arraytext)
                     return m
                 def find(self, node, f):
                     '''look up entry for a single file efficiently.
                     return (node, flags) pair if found, (None, None) if not.'''
                     m = self.read(node)
                     try:
                         return m.find(f)
                     except KeyError:
                         return None, None
                 def add(self, m, transaction, link, p1, p2, added, removed):
                     if p1 in self._mancache and not self._usetreemanifest:
                         # If our first parent is in the manifest cache, we can
                         # compute a delta here using properties we know about the
                         # manifest up-front, which may save time later for the
                         # revlog layer.
                         _checkforbidden(added)
                         # combine the changed lists into one list for sorting
                         work = [(x, False) for x in added]
                         work.extend((x, True) for x in removed)
                         # this could use heapq.merge() (from Python 2.6+) or equivalent
                         # since the lists are already sorted
                         work.sort()
                         arraytext, deltatext = m.fastdelta(self._mancache[p1][1], work)
                         cachedelta = self.rev(p1), deltatext
                         text = util.buffer(arraytext)
                     else:
                         # The first parent manifest isn't already loaded, so we'll
                         # just encode a fulltext of the manifest and pass that
                         # through to the revlog layer, and let it handle the delta
                         # process.
                         text = m.text()
                         arraytext = array.array('c', text)
                         cachedelta = None
                     n = self.addrevision(text, transaction, link, p1, p2, cachedelta)
                     self._mancache[n] = (m, arraytext)
                     return n