##// END OF EJS Templates
tags: extract fnode retrieval into its own function...
Pierre-Yves David -
r31705:5eb4d206 default
parent child Browse files
Show More
@@ -1,671 +1,680 b''
1 # tags.py - read tag info from local repository
1 # tags.py - read tag info from local repository
2 #
2 #
3 # Copyright 2009 Matt Mackall <mpm@selenic.com>
3 # Copyright 2009 Matt Mackall <mpm@selenic.com>
4 # Copyright 2009 Greg Ward <greg@gerg.ca>
4 # Copyright 2009 Greg Ward <greg@gerg.ca>
5 #
5 #
6 # This software may be used and distributed according to the terms of the
6 # This software may be used and distributed according to the terms of the
7 # GNU General Public License version 2 or any later version.
7 # GNU General Public License version 2 or any later version.
8
8
9 # Currently this module only deals with reading and caching tags.
9 # Currently this module only deals with reading and caching tags.
10 # Eventually, it could take care of updating (adding/removing/moving)
10 # Eventually, it could take care of updating (adding/removing/moving)
11 # tags too.
11 # tags too.
12
12
13 from __future__ import absolute_import
13 from __future__ import absolute_import
14
14
15 import errno
15 import errno
16
16
17 from .node import (
17 from .node import (
18 bin,
18 bin,
19 hex,
19 hex,
20 nullid,
20 nullid,
21 short,
21 short,
22 )
22 )
23 from .i18n import _
23 from .i18n import _
24 from . import (
24 from . import (
25 encoding,
25 encoding,
26 error,
26 error,
27 match as matchmod,
27 match as matchmod,
28 scmutil,
28 scmutil,
29 util,
29 util,
30 )
30 )
31
31
32 # Tags computation can be expensive and caches exist to make it fast in
32 # Tags computation can be expensive and caches exist to make it fast in
33 # the common case.
33 # the common case.
34 #
34 #
35 # The "hgtagsfnodes1" cache file caches the .hgtags filenode values for
35 # The "hgtagsfnodes1" cache file caches the .hgtags filenode values for
36 # each revision in the repository. The file is effectively an array of
36 # each revision in the repository. The file is effectively an array of
37 # fixed length records. Read the docs for "hgtagsfnodescache" for technical
37 # fixed length records. Read the docs for "hgtagsfnodescache" for technical
38 # details.
38 # details.
39 #
39 #
40 # The .hgtags filenode cache grows in proportion to the length of the
40 # The .hgtags filenode cache grows in proportion to the length of the
41 # changelog. The file is truncated when the # changelog is stripped.
41 # changelog. The file is truncated when the # changelog is stripped.
42 #
42 #
43 # The purpose of the filenode cache is to avoid the most expensive part
43 # The purpose of the filenode cache is to avoid the most expensive part
44 # of finding global tags, which is looking up the .hgtags filenode in the
44 # of finding global tags, which is looking up the .hgtags filenode in the
45 # manifest for each head. This can take dozens or over 100ms for
45 # manifest for each head. This can take dozens or over 100ms for
46 # repositories with very large manifests. Multiplied by dozens or even
46 # repositories with very large manifests. Multiplied by dozens or even
47 # hundreds of heads and there is a significant performance concern.
47 # hundreds of heads and there is a significant performance concern.
48 #
48 #
49 # There also exist a separate cache file for each repository filter.
49 # There also exist a separate cache file for each repository filter.
50 # These "tags-*" files store information about the history of tags.
50 # These "tags-*" files store information about the history of tags.
51 #
51 #
52 # The tags cache files consists of a cache validation line followed by
52 # The tags cache files consists of a cache validation line followed by
53 # a history of tags.
53 # a history of tags.
54 #
54 #
55 # The cache validation line has the format:
55 # The cache validation line has the format:
56 #
56 #
57 # <tiprev> <tipnode> [<filteredhash>]
57 # <tiprev> <tipnode> [<filteredhash>]
58 #
58 #
59 # <tiprev> is an integer revision and <tipnode> is a 40 character hex
59 # <tiprev> is an integer revision and <tipnode> is a 40 character hex
60 # node for that changeset. These redundantly identify the repository
60 # node for that changeset. These redundantly identify the repository
61 # tip from the time the cache was written. In addition, <filteredhash>,
61 # tip from the time the cache was written. In addition, <filteredhash>,
62 # if present, is a 40 character hex hash of the contents of the filtered
62 # if present, is a 40 character hex hash of the contents of the filtered
63 # revisions for this filter. If the set of filtered revs changes, the
63 # revisions for this filter. If the set of filtered revs changes, the
64 # hash will change and invalidate the cache.
64 # hash will change and invalidate the cache.
65 #
65 #
66 # The history part of the tags cache consists of lines of the form:
66 # The history part of the tags cache consists of lines of the form:
67 #
67 #
68 # <node> <tag>
68 # <node> <tag>
69 #
69 #
70 # (This format is identical to that of .hgtags files.)
70 # (This format is identical to that of .hgtags files.)
71 #
71 #
72 # <tag> is the tag name and <node> is the 40 character hex changeset
72 # <tag> is the tag name and <node> is the 40 character hex changeset
73 # the tag is associated with.
73 # the tag is associated with.
74 #
74 #
75 # Tags are written sorted by tag name.
75 # Tags are written sorted by tag name.
76 #
76 #
77 # Tags associated with multiple changesets have an entry for each changeset.
77 # Tags associated with multiple changesets have an entry for each changeset.
78 # The most recent changeset (in terms of revlog ordering for the head
78 # The most recent changeset (in terms of revlog ordering for the head
79 # setting it) for each tag is last.
79 # setting it) for each tag is last.
80
80
81 def findglobaltags(ui, repo, alltags, tagtypes):
81 def findglobaltags(ui, repo, alltags, tagtypes):
82 '''Find global tags in a repo.
82 '''Find global tags in a repo.
83
83
84 "alltags" maps tag name to (node, hist) 2-tuples.
84 "alltags" maps tag name to (node, hist) 2-tuples.
85
85
86 "tagtypes" maps tag name to tag type. Global tags always have the
86 "tagtypes" maps tag name to tag type. Global tags always have the
87 "global" tag type.
87 "global" tag type.
88
88
89 The "alltags" and "tagtypes" dicts are updated in place. Empty dicts
89 The "alltags" and "tagtypes" dicts are updated in place. Empty dicts
90 should be passed in.
90 should be passed in.
91
91
92 The tags cache is read and updated as a side-effect of calling.
92 The tags cache is read and updated as a side-effect of calling.
93 '''
93 '''
94 # This is so we can be lazy and assume alltags contains only global
94 # This is so we can be lazy and assume alltags contains only global
95 # tags when we pass it to _writetagcache().
95 # tags when we pass it to _writetagcache().
96 assert len(alltags) == len(tagtypes) == 0, \
96 assert len(alltags) == len(tagtypes) == 0, \
97 "findglobaltags() should be called first"
97 "findglobaltags() should be called first"
98
98
99 (heads, tagfnode, valid, cachetags, shouldwrite) = _readtagcache(ui, repo)
99 (heads, tagfnode, valid, cachetags, shouldwrite) = _readtagcache(ui, repo)
100 if cachetags is not None:
100 if cachetags is not None:
101 assert not shouldwrite
101 assert not shouldwrite
102 # XXX is this really 100% correct? are there oddball special
102 # XXX is this really 100% correct? are there oddball special
103 # cases where a global tag should outrank a local tag but won't,
103 # cases where a global tag should outrank a local tag but won't,
104 # because cachetags does not contain rank info?
104 # because cachetags does not contain rank info?
105 _updatetags(cachetags, 'global', alltags, tagtypes)
105 _updatetags(cachetags, 'global', alltags, tagtypes)
106 return
106 return
107
107
108 seen = set() # set of fnode
108 seen = set() # set of fnode
109 fctx = None
109 fctx = None
110 for head in reversed(heads): # oldest to newest
110 for head in reversed(heads): # oldest to newest
111 assert head in repo.changelog.nodemap, \
111 assert head in repo.changelog.nodemap, \
112 "tag cache returned bogus head %s" % short(head)
112 "tag cache returned bogus head %s" % short(head)
113
113
114 fnode = tagfnode.get(head)
114 fnode = tagfnode.get(head)
115 if fnode and fnode not in seen:
115 if fnode and fnode not in seen:
116 seen.add(fnode)
116 seen.add(fnode)
117 if not fctx:
117 if not fctx:
118 fctx = repo.filectx('.hgtags', fileid=fnode)
118 fctx = repo.filectx('.hgtags', fileid=fnode)
119 else:
119 else:
120 fctx = fctx.filectx(fnode)
120 fctx = fctx.filectx(fnode)
121
121
122 filetags = _readtags(ui, repo, fctx.data().splitlines(), fctx)
122 filetags = _readtags(ui, repo, fctx.data().splitlines(), fctx)
123 _updatetags(filetags, 'global', alltags, tagtypes)
123 _updatetags(filetags, 'global', alltags, tagtypes)
124
124
125 # and update the cache (if necessary)
125 # and update the cache (if necessary)
126 if shouldwrite:
126 if shouldwrite:
127 _writetagcache(ui, repo, valid, alltags)
127 _writetagcache(ui, repo, valid, alltags)
128
128
129 def readlocaltags(ui, repo, alltags, tagtypes):
129 def readlocaltags(ui, repo, alltags, tagtypes):
130 '''Read local tags in repo. Update alltags and tagtypes.'''
130 '''Read local tags in repo. Update alltags and tagtypes.'''
131 try:
131 try:
132 data = repo.vfs.read("localtags")
132 data = repo.vfs.read("localtags")
133 except IOError as inst:
133 except IOError as inst:
134 if inst.errno != errno.ENOENT:
134 if inst.errno != errno.ENOENT:
135 raise
135 raise
136 return
136 return
137
137
138 # localtags is in the local encoding; re-encode to UTF-8 on
138 # localtags is in the local encoding; re-encode to UTF-8 on
139 # input for consistency with the rest of this module.
139 # input for consistency with the rest of this module.
140 filetags = _readtags(
140 filetags = _readtags(
141 ui, repo, data.splitlines(), "localtags",
141 ui, repo, data.splitlines(), "localtags",
142 recode=encoding.fromlocal)
142 recode=encoding.fromlocal)
143
143
144 # remove tags pointing to invalid nodes
144 # remove tags pointing to invalid nodes
145 cl = repo.changelog
145 cl = repo.changelog
146 for t in filetags.keys():
146 for t in filetags.keys():
147 try:
147 try:
148 cl.rev(filetags[t][0])
148 cl.rev(filetags[t][0])
149 except (LookupError, ValueError):
149 except (LookupError, ValueError):
150 del filetags[t]
150 del filetags[t]
151
151
152 _updatetags(filetags, "local", alltags, tagtypes)
152 _updatetags(filetags, "local", alltags, tagtypes)
153
153
154 def _readtaghist(ui, repo, lines, fn, recode=None, calcnodelines=False):
154 def _readtaghist(ui, repo, lines, fn, recode=None, calcnodelines=False):
155 '''Read tag definitions from a file (or any source of lines).
155 '''Read tag definitions from a file (or any source of lines).
156
156
157 This function returns two sortdicts with similar information:
157 This function returns two sortdicts with similar information:
158
158
159 - the first dict, bintaghist, contains the tag information as expected by
159 - the first dict, bintaghist, contains the tag information as expected by
160 the _readtags function, i.e. a mapping from tag name to (node, hist):
160 the _readtags function, i.e. a mapping from tag name to (node, hist):
161 - node is the node id from the last line read for that name,
161 - node is the node id from the last line read for that name,
162 - hist is the list of node ids previously associated with it (in file
162 - hist is the list of node ids previously associated with it (in file
163 order). All node ids are binary, not hex.
163 order). All node ids are binary, not hex.
164
164
165 - the second dict, hextaglines, is a mapping from tag name to a list of
165 - the second dict, hextaglines, is a mapping from tag name to a list of
166 [hexnode, line number] pairs, ordered from the oldest to the newest node.
166 [hexnode, line number] pairs, ordered from the oldest to the newest node.
167
167
168 When calcnodelines is False the hextaglines dict is not calculated (an
168 When calcnodelines is False the hextaglines dict is not calculated (an
169 empty dict is returned). This is done to improve this function's
169 empty dict is returned). This is done to improve this function's
170 performance in cases where the line numbers are not needed.
170 performance in cases where the line numbers are not needed.
171 '''
171 '''
172
172
173 bintaghist = util.sortdict()
173 bintaghist = util.sortdict()
174 hextaglines = util.sortdict()
174 hextaglines = util.sortdict()
175 count = 0
175 count = 0
176
176
177 def dbg(msg):
177 def dbg(msg):
178 ui.debug("%s, line %s: %s\n" % (fn, count, msg))
178 ui.debug("%s, line %s: %s\n" % (fn, count, msg))
179
179
180 for nline, line in enumerate(lines):
180 for nline, line in enumerate(lines):
181 count += 1
181 count += 1
182 if not line:
182 if not line:
183 continue
183 continue
184 try:
184 try:
185 (nodehex, name) = line.split(" ", 1)
185 (nodehex, name) = line.split(" ", 1)
186 except ValueError:
186 except ValueError:
187 dbg("cannot parse entry")
187 dbg("cannot parse entry")
188 continue
188 continue
189 name = name.strip()
189 name = name.strip()
190 if recode:
190 if recode:
191 name = recode(name)
191 name = recode(name)
192 try:
192 try:
193 nodebin = bin(nodehex)
193 nodebin = bin(nodehex)
194 except TypeError:
194 except TypeError:
195 dbg("node '%s' is not well formed" % nodehex)
195 dbg("node '%s' is not well formed" % nodehex)
196 continue
196 continue
197
197
198 # update filetags
198 # update filetags
199 if calcnodelines:
199 if calcnodelines:
200 # map tag name to a list of line numbers
200 # map tag name to a list of line numbers
201 if name not in hextaglines:
201 if name not in hextaglines:
202 hextaglines[name] = []
202 hextaglines[name] = []
203 hextaglines[name].append([nodehex, nline])
203 hextaglines[name].append([nodehex, nline])
204 continue
204 continue
205 # map tag name to (node, hist)
205 # map tag name to (node, hist)
206 if name not in bintaghist:
206 if name not in bintaghist:
207 bintaghist[name] = []
207 bintaghist[name] = []
208 bintaghist[name].append(nodebin)
208 bintaghist[name].append(nodebin)
209 return bintaghist, hextaglines
209 return bintaghist, hextaglines
210
210
211 def _readtags(ui, repo, lines, fn, recode=None, calcnodelines=False):
211 def _readtags(ui, repo, lines, fn, recode=None, calcnodelines=False):
212 '''Read tag definitions from a file (or any source of lines).
212 '''Read tag definitions from a file (or any source of lines).
213
213
214 Returns a mapping from tag name to (node, hist).
214 Returns a mapping from tag name to (node, hist).
215
215
216 "node" is the node id from the last line read for that name. "hist"
216 "node" is the node id from the last line read for that name. "hist"
217 is the list of node ids previously associated with it (in file order).
217 is the list of node ids previously associated with it (in file order).
218 All node ids are binary, not hex.
218 All node ids are binary, not hex.
219 '''
219 '''
220 filetags, nodelines = _readtaghist(ui, repo, lines, fn, recode=recode,
220 filetags, nodelines = _readtaghist(ui, repo, lines, fn, recode=recode,
221 calcnodelines=calcnodelines)
221 calcnodelines=calcnodelines)
222 # util.sortdict().__setitem__ is much slower at replacing then inserting
222 # util.sortdict().__setitem__ is much slower at replacing then inserting
223 # new entries. The difference can matter if there are thousands of tags.
223 # new entries. The difference can matter if there are thousands of tags.
224 # Create a new sortdict to avoid the performance penalty.
224 # Create a new sortdict to avoid the performance penalty.
225 newtags = util.sortdict()
225 newtags = util.sortdict()
226 for tag, taghist in filetags.items():
226 for tag, taghist in filetags.items():
227 newtags[tag] = (taghist[-1], taghist[:-1])
227 newtags[tag] = (taghist[-1], taghist[:-1])
228 return newtags
228 return newtags
229
229
230 def _updatetags(filetags, tagtype, alltags, tagtypes):
230 def _updatetags(filetags, tagtype, alltags, tagtypes):
231 '''Incorporate the tag info read from one file into the two
231 '''Incorporate the tag info read from one file into the two
232 dictionaries, alltags and tagtypes, that contain all tag
232 dictionaries, alltags and tagtypes, that contain all tag
233 info (global across all heads plus local).'''
233 info (global across all heads plus local).'''
234
234
235 for name, nodehist in filetags.iteritems():
235 for name, nodehist in filetags.iteritems():
236 if name not in alltags:
236 if name not in alltags:
237 alltags[name] = nodehist
237 alltags[name] = nodehist
238 tagtypes[name] = tagtype
238 tagtypes[name] = tagtype
239 continue
239 continue
240
240
241 # we prefer alltags[name] if:
241 # we prefer alltags[name] if:
242 # it supersedes us OR
242 # it supersedes us OR
243 # mutual supersedes and it has a higher rank
243 # mutual supersedes and it has a higher rank
244 # otherwise we win because we're tip-most
244 # otherwise we win because we're tip-most
245 anode, ahist = nodehist
245 anode, ahist = nodehist
246 bnode, bhist = alltags[name]
246 bnode, bhist = alltags[name]
247 if (bnode != anode and anode in bhist and
247 if (bnode != anode and anode in bhist and
248 (bnode not in ahist or len(bhist) > len(ahist))):
248 (bnode not in ahist or len(bhist) > len(ahist))):
249 anode = bnode
249 anode = bnode
250 else:
250 else:
251 tagtypes[name] = tagtype
251 tagtypes[name] = tagtype
252 ahist.extend([n for n in bhist if n not in ahist])
252 ahist.extend([n for n in bhist if n not in ahist])
253 alltags[name] = anode, ahist
253 alltags[name] = anode, ahist
254
254
255 def _filename(repo):
255 def _filename(repo):
256 """name of a tagcache file for a given repo or repoview"""
256 """name of a tagcache file for a given repo or repoview"""
257 filename = 'cache/tags2'
257 filename = 'cache/tags2'
258 if repo.filtername:
258 if repo.filtername:
259 filename = '%s-%s' % (filename, repo.filtername)
259 filename = '%s-%s' % (filename, repo.filtername)
260 return filename
260 return filename
261
261
262 def _readtagcache(ui, repo):
262 def _readtagcache(ui, repo):
263 '''Read the tag cache.
263 '''Read the tag cache.
264
264
265 Returns a tuple (heads, fnodes, validinfo, cachetags, shouldwrite).
265 Returns a tuple (heads, fnodes, validinfo, cachetags, shouldwrite).
266
266
267 If the cache is completely up-to-date, "cachetags" is a dict of the
267 If the cache is completely up-to-date, "cachetags" is a dict of the
268 form returned by _readtags() and "heads", "fnodes", and "validinfo" are
268 form returned by _readtags() and "heads", "fnodes", and "validinfo" are
269 None and "shouldwrite" is False.
269 None and "shouldwrite" is False.
270
270
271 If the cache is not up to date, "cachetags" is None. "heads" is a list
271 If the cache is not up to date, "cachetags" is None. "heads" is a list
272 of all heads currently in the repository, ordered from tip to oldest.
272 of all heads currently in the repository, ordered from tip to oldest.
273 "validinfo" is a tuple describing cache validation info. This is used
273 "validinfo" is a tuple describing cache validation info. This is used
274 when writing the tags cache. "fnodes" is a mapping from head to .hgtags
274 when writing the tags cache. "fnodes" is a mapping from head to .hgtags
275 filenode. "shouldwrite" is True.
275 filenode. "shouldwrite" is True.
276
276
277 If the cache is not up to date, the caller is responsible for reading tag
277 If the cache is not up to date, the caller is responsible for reading tag
278 info from each returned head. (See findglobaltags().)
278 info from each returned head. (See findglobaltags().)
279 '''
279 '''
280 try:
280 try:
281 cachefile = repo.vfs(_filename(repo), 'r')
281 cachefile = repo.vfs(_filename(repo), 'r')
282 # force reading the file for static-http
282 # force reading the file for static-http
283 cachelines = iter(cachefile)
283 cachelines = iter(cachefile)
284 except IOError:
284 except IOError:
285 cachefile = None
285 cachefile = None
286
286
287 cacherev = None
287 cacherev = None
288 cachenode = None
288 cachenode = None
289 cachehash = None
289 cachehash = None
290 if cachefile:
290 if cachefile:
291 try:
291 try:
292 validline = next(cachelines)
292 validline = next(cachelines)
293 validline = validline.split()
293 validline = validline.split()
294 cacherev = int(validline[0])
294 cacherev = int(validline[0])
295 cachenode = bin(validline[1])
295 cachenode = bin(validline[1])
296 if len(validline) > 2:
296 if len(validline) > 2:
297 cachehash = bin(validline[2])
297 cachehash = bin(validline[2])
298 except Exception:
298 except Exception:
299 # corruption of the cache, just recompute it.
299 # corruption of the cache, just recompute it.
300 pass
300 pass
301
301
302 tipnode = repo.changelog.tip()
302 tipnode = repo.changelog.tip()
303 tiprev = len(repo.changelog) - 1
303 tiprev = len(repo.changelog) - 1
304
304
305 # Case 1 (common): tip is the same, so nothing has changed.
305 # Case 1 (common): tip is the same, so nothing has changed.
306 # (Unchanged tip trivially means no changesets have been added.
306 # (Unchanged tip trivially means no changesets have been added.
307 # But, thanks to localrepository.destroyed(), it also means none
307 # But, thanks to localrepository.destroyed(), it also means none
308 # have been destroyed by strip or rollback.)
308 # have been destroyed by strip or rollback.)
309 if (cacherev == tiprev
309 if (cacherev == tiprev
310 and cachenode == tipnode
310 and cachenode == tipnode
311 and cachehash == scmutil.filteredhash(repo, tiprev)):
311 and cachehash == scmutil.filteredhash(repo, tiprev)):
312 tags = _readtags(ui, repo, cachelines, cachefile.name)
312 tags = _readtags(ui, repo, cachelines, cachefile.name)
313 cachefile.close()
313 cachefile.close()
314 return (None, None, None, tags, False)
314 return (None, None, None, tags, False)
315 if cachefile:
315 if cachefile:
316 cachefile.close() # ignore rest of file
316 cachefile.close() # ignore rest of file
317
317
318 valid = (tiprev, tipnode, scmutil.filteredhash(repo, tiprev))
318 valid = (tiprev, tipnode, scmutil.filteredhash(repo, tiprev))
319
319
320 repoheads = repo.heads()
320 repoheads = repo.heads()
321 # Case 2 (uncommon): empty repo; get out quickly and don't bother
321 # Case 2 (uncommon): empty repo; get out quickly and don't bother
322 # writing an empty cache.
322 # writing an empty cache.
323 if repoheads == [nullid]:
323 if repoheads == [nullid]:
324 return ([], {}, valid, {}, False)
324 return ([], {}, valid, {}, False)
325
325
326 # Case 3 (uncommon): cache file missing or empty.
326 # Case 3 (uncommon): cache file missing or empty.
327
327
328 # Case 4 (uncommon): tip rev decreased. This should only happen
328 # Case 4 (uncommon): tip rev decreased. This should only happen
329 # when we're called from localrepository.destroyed(). Refresh the
329 # when we're called from localrepository.destroyed(). Refresh the
330 # cache so future invocations will not see disappeared heads in the
330 # cache so future invocations will not see disappeared heads in the
331 # cache.
331 # cache.
332
332
333 # Case 5 (common): tip has changed, so we've added/replaced heads.
333 # Case 5 (common): tip has changed, so we've added/replaced heads.
334
334
335 # As it happens, the code to handle cases 3, 4, 5 is the same.
335 # As it happens, the code to handle cases 3, 4, 5 is the same.
336
336
337 # N.B. in case 4 (nodes destroyed), "new head" really means "newly
337 # N.B. in case 4 (nodes destroyed), "new head" really means "newly
338 # exposed".
338 # exposed".
339 if not len(repo.file('.hgtags')):
339 if not len(repo.file('.hgtags')):
340 # No tags have ever been committed, so we can avoid a
340 # No tags have ever been committed, so we can avoid a
341 # potentially expensive search.
341 # potentially expensive search.
342 return ([], {}, valid, None, True)
342 return ([], {}, valid, None, True)
343
343
344 starttime = util.timer()
345
344
346 # Now we have to lookup the .hgtags filenode for every new head.
345 # Now we have to lookup the .hgtags filenode for every new head.
347 # This is the most expensive part of finding tags, so performance
346 # This is the most expensive part of finding tags, so performance
348 # depends primarily on the size of newheads. Worst case: no cache
347 # depends primarily on the size of newheads. Worst case: no cache
349 # file, so newheads == repoheads.
348 # file, so newheads == repoheads.
349 cachefnode = _getfnodes(ui, repo, repoheads)
350
351 # Caller has to iterate over all heads, but can use the filenodes in
352 # cachefnode to get to each .hgtags revision quickly.
353 return (repoheads, cachefnode, valid, None, True)
354
355 def _getfnodes(ui, repo, nodes):
356 """return .hgtags fnodes for a list of changeset nodes
357
358 Return value is a {node: fnode} mapping. There will be no entry for nodes
359 without a '.hgtags' file.
360 """
361 starttime = util.timer()
350 fnodescache = hgtagsfnodescache(repo.unfiltered())
362 fnodescache = hgtagsfnodescache(repo.unfiltered())
351 cachefnode = {}
363 cachefnode = {}
352 for head in reversed(repoheads):
364 for head in reversed(nodes):
353 fnode = fnodescache.getfnode(head)
365 fnode = fnodescache.getfnode(head)
354 if fnode != nullid:
366 if fnode != nullid:
355 cachefnode[head] = fnode
367 cachefnode[head] = fnode
356
368
357 fnodescache.write()
369 fnodescache.write()
358
370
359 duration = util.timer() - starttime
371 duration = util.timer() - starttime
360 ui.log('tagscache',
372 ui.log('tagscache',
361 '%d/%d cache hits/lookups in %0.4f '
373 '%d/%d cache hits/lookups in %0.4f '
362 'seconds\n',
374 'seconds\n',
363 fnodescache.hitcount, fnodescache.lookupcount, duration)
375 fnodescache.hitcount, fnodescache.lookupcount, duration)
364
376 return cachefnode
365 # Caller has to iterate over all heads, but can use the filenodes in
366 # cachefnode to get to each .hgtags revision quickly.
367 return (repoheads, cachefnode, valid, None, True)
368
377
369 def _writetagcache(ui, repo, valid, cachetags):
378 def _writetagcache(ui, repo, valid, cachetags):
370 filename = _filename(repo)
379 filename = _filename(repo)
371 try:
380 try:
372 cachefile = repo.vfs(filename, 'w', atomictemp=True)
381 cachefile = repo.vfs(filename, 'w', atomictemp=True)
373 except (OSError, IOError):
382 except (OSError, IOError):
374 return
383 return
375
384
376 ui.log('tagscache', 'writing .hg/%s with %d tags\n',
385 ui.log('tagscache', 'writing .hg/%s with %d tags\n',
377 filename, len(cachetags))
386 filename, len(cachetags))
378
387
379 if valid[2]:
388 if valid[2]:
380 cachefile.write('%d %s %s\n' % (valid[0], hex(valid[1]), hex(valid[2])))
389 cachefile.write('%d %s %s\n' % (valid[0], hex(valid[1]), hex(valid[2])))
381 else:
390 else:
382 cachefile.write('%d %s\n' % (valid[0], hex(valid[1])))
391 cachefile.write('%d %s\n' % (valid[0], hex(valid[1])))
383
392
384 # Tag names in the cache are in UTF-8 -- which is the whole reason
393 # Tag names in the cache are in UTF-8 -- which is the whole reason
385 # we keep them in UTF-8 throughout this module. If we converted
394 # we keep them in UTF-8 throughout this module. If we converted
386 # them local encoding on input, we would lose info writing them to
395 # them local encoding on input, we would lose info writing them to
387 # the cache.
396 # the cache.
388 for (name, (node, hist)) in sorted(cachetags.iteritems()):
397 for (name, (node, hist)) in sorted(cachetags.iteritems()):
389 for n in hist:
398 for n in hist:
390 cachefile.write("%s %s\n" % (hex(n), name))
399 cachefile.write("%s %s\n" % (hex(n), name))
391 cachefile.write("%s %s\n" % (hex(node), name))
400 cachefile.write("%s %s\n" % (hex(node), name))
392
401
393 try:
402 try:
394 cachefile.close()
403 cachefile.close()
395 except (OSError, IOError):
404 except (OSError, IOError):
396 pass
405 pass
397
406
398 def tag(repo, names, node, message, local, user, date, editor=False):
407 def tag(repo, names, node, message, local, user, date, editor=False):
399 '''tag a revision with one or more symbolic names.
408 '''tag a revision with one or more symbolic names.
400
409
401 names is a list of strings or, when adding a single tag, names may be a
410 names is a list of strings or, when adding a single tag, names may be a
402 string.
411 string.
403
412
404 if local is True, the tags are stored in a per-repository file.
413 if local is True, the tags are stored in a per-repository file.
405 otherwise, they are stored in the .hgtags file, and a new
414 otherwise, they are stored in the .hgtags file, and a new
406 changeset is committed with the change.
415 changeset is committed with the change.
407
416
408 keyword arguments:
417 keyword arguments:
409
418
410 local: whether to store tags in non-version-controlled file
419 local: whether to store tags in non-version-controlled file
411 (default False)
420 (default False)
412
421
413 message: commit message to use if committing
422 message: commit message to use if committing
414
423
415 user: name of user to use if committing
424 user: name of user to use if committing
416
425
417 date: date tuple to use if committing'''
426 date: date tuple to use if committing'''
418
427
419 if not local:
428 if not local:
420 m = matchmod.exact(repo.root, '', ['.hgtags'])
429 m = matchmod.exact(repo.root, '', ['.hgtags'])
421 if any(repo.status(match=m, unknown=True, ignored=True)):
430 if any(repo.status(match=m, unknown=True, ignored=True)):
422 raise error.Abort(_('working copy of .hgtags is changed'),
431 raise error.Abort(_('working copy of .hgtags is changed'),
423 hint=_('please commit .hgtags manually'))
432 hint=_('please commit .hgtags manually'))
424
433
425 repo.tags() # instantiate the cache
434 repo.tags() # instantiate the cache
426 _tag(repo.unfiltered(), names, node, message, local, user, date,
435 _tag(repo.unfiltered(), names, node, message, local, user, date,
427 editor=editor)
436 editor=editor)
428
437
def _tag(repo, names, node, message, local, user, date, extra=None,
         editor=False):
    """Record tag(s) ``names`` for changeset ``node``.

    ``names`` may be a single name (str) or an iterable of names. For
    every name the 'pretag' hook runs first (with throw=True, so it can
    abort the whole operation); the 'tag' hook runs after the write.

    If ``local`` is true, the tags are appended to ``.hg/localtags``
    (stored in the local charset) and the function returns without
    committing. Otherwise the tags are appended to ``.hgtags`` (stored
    in UTF-8), the file is committed with ``message``/``user``/``date``/
    ``extra``, and the node of the new tag changeset is returned.
    """
    # Accept a bare string as a one-element tuple of names.
    if isinstance(names, str):
        names = (names,)

    branches = repo.branchmap()
    for name in names:
        repo.hook('pretag', throw=True, node=hex(node), tag=name,
                  local=local)
        # Tags and branches share a namespace for lookup purposes, so
        # warn (but do not abort) when a tag shadows a branch name.
        if name in branches:
            repo.ui.warn(_("warning: tag %s conflicts with existing"
                           " branch name\n") % name)

    def writetags(fp, names, munge, prevtags):
        # Append one record per name to the already-open tags file and
        # close it. ``munge``, if given, transcodes each name before
        # writing (used for the UTF-8 .hgtags file).
        fp.seek(0, 2)
        if prevtags and prevtags[-1] != '\n':
            fp.write('\n')
        for name in names:
            if munge:
                m = munge(name)
            else:
                m = name

            # For a tag that already exists, first write a line with its
            # previous node before the line with the new node.
            if (repo._tagscache.tagtypes and
                name in repo._tagscache.tagtypes):
                old = repo.tags().get(name, nullid)
                fp.write('%s %s\n' % (hex(old), m))
            fp.write('%s %s\n' % (hex(node), m))
        fp.close()

    prevtags = ''
    if local:
        try:
            # Open read-write if the file exists so prevtags can be read...
            fp = repo.vfs('localtags', 'r+')
        except IOError:
            # ...otherwise create it in append mode.
            fp = repo.vfs('localtags', 'a')
        else:
            prevtags = fp.read()

        # local tags are stored in the current charset
        writetags(fp, names, None, prevtags)
        for name in names:
            repo.hook('tag', node=hex(node), tag=name, local=local)
        # Local tags never produce a commit.
        return

    try:
        fp = repo.wvfs('.hgtags', 'rb+')
    except IOError as e:
        if e.errno != errno.ENOENT:
            raise
        fp = repo.wvfs('.hgtags', 'ab')
    else:
        prevtags = fp.read()

    # committed tags are stored in UTF-8
    writetags(fp, names, encoding.fromlocal, prevtags)

    # writetags() already closed fp; a second close() is a no-op.
    fp.close()

    repo.invalidatecaches()

    if '.hgtags' not in repo.dirstate:
        repo[None].add(['.hgtags'])

    # Commit only the .hgtags file, nothing else in the working copy.
    m = matchmod.exact(repo.root, '', ['.hgtags'])
    tagnode = repo.commit(message, user, date, extra=extra, match=m,
                          editor=editor)

    for name in names:
        repo.hook('tag', node=hex(node), tag=name, local=local)

    return tagnode
501
510
# Location (relative to .hg) of the persistent .hgtags filenode cache.
_fnodescachefile = 'cache/hgtagsfnodes1'
# Size of one cache record: 4-byte changeset fragment + 20-byte filenode.
_fnodesrecsize = 4 + 20
# A record of all 0xff bytes marks a revision with no cached entry.
_fnodesmissingrec = '\xff' * 24
505
514
class hgtagsfnodescache(object):
    """Persistent cache mapping revisions to .hgtags filenodes.

    The cache is an array of records. Each item in the array corresponds to
    a changelog revision. Values in the array contain the first 4 bytes of
    the node hash and the 20 bytes .hgtags filenode for that revision.

    The first 4 bytes are present as a form of verification. Repository
    stripping and rewriting may change the node at a numeric revision in the
    changelog. The changeset fragment serves as a verifier to detect
    rewriting. This logic is shared with the rev branch cache (see
    branchmap.py).

    The instance holds in memory the full cache content but entries are
    only parsed on read.

    Instances behave like lists. ``c[i]`` works where i is a rev or
    changeset node. Missing indexes are populated automatically on access.
    """
    def __init__(self, repo):
        # The cache is keyed by changelog revision number, so it only
        # makes sense on the unfiltered repository.
        assert repo.filtername is None

        self._repo = repo

        # Only for reporting purposes.
        self.lookupcount = 0
        self.hitcount = 0


        # Missing or unreadable cache file degrades to an empty cache.
        try:
            data = repo.vfs.read(_fnodescachefile)
        except (OSError, IOError):
            data = ""
        self._raw = bytearray(data)

        # The end state of self._raw is an array that is of the exact length
        # required to hold a record for every revision in the repository.
        # We truncate or extend the array as necessary. self._dirtyoffset is
        # defined to be the start offset at which we need to write the output
        # file. This offset is also adjusted when new entries are calculated
        # for array members.
        cllen = len(repo.changelog)
        wantedlen = cllen * _fnodesrecsize
        rawlen = len(self._raw)

        self._dirtyoffset = None

        if rawlen < wantedlen:
            # Pad with "missing" bytes; everything past the old end is dirty.
            self._dirtyoffset = rawlen
            self._raw.extend('\xff' * (wantedlen - rawlen))
        elif rawlen > wantedlen:
            # There's no easy way to truncate array instances. This seems
            # slightly less evil than copying a potentially large array slice.
            for i in range(rawlen - wantedlen):
                self._raw.pop()
            self._dirtyoffset = len(self._raw)

    def getfnode(self, node, computemissing=True):
        """Obtain the filenode of the .hgtags file at a specified revision.

        If the value is in the cache, the entry will be validated and returned.
        Otherwise, the filenode will be computed and returned unless
        "computemissing" is False, in which case None will be returned without
        any potentially expensive computation being performed.

        If an .hgtags does not exist at the specified revision, nullid is
        returned.
        """
        ctx = self._repo[node]
        rev = ctx.rev()

        self.lookupcount += 1

        # Record for ``rev`` lives at a fixed offset in the flat array.
        offset = rev * _fnodesrecsize
        # Stringify the bytearray slice so it compares against the str
        # sentinel _fnodesmissingrec (Python 2 '%s' % bytearray semantics).
        record = '%s' % self._raw[offset:offset + _fnodesrecsize]
        properprefix = node[0:4]

        # Validate and return existing entry.
        if record != _fnodesmissingrec:
            fileprefix = record[0:4]

            # The stored 4-byte node fragment must match the current node
            # at this revision, otherwise the entry is stale (strip/rewrite).
            if fileprefix == properprefix:
                self.hitcount += 1
                return record[4:]

            # Fall through.

        # If we get here, the entry is either missing or invalid.

        if not computemissing:
            return None

        # Populate missing entry.
        try:
            fnode = ctx.filenode('.hgtags')
        except error.LookupError:
            # No .hgtags file on this revision.
            fnode = nullid

        self._writeentry(offset, properprefix, fnode)
        return fnode

    def setfnode(self, node, fnode):
        """Set the .hgtags filenode for a given changeset."""
        assert len(fnode) == 20
        ctx = self._repo[node]

        # Do a lookup first to avoid writing if nothing has changed.
        if self.getfnode(ctx.node(), computemissing=False) == fnode:
            return

        self._writeentry(ctx.rev() * _fnodesrecsize, node[0:4], fnode)

    def _writeentry(self, offset, prefix, fnode):
        # Store one 24-byte record in memory and widen the dirty region
        # so write() knows to flush from here.
        # Slices on array instances only accept other array.
        entry = bytearray(prefix + fnode)
        self._raw[offset:offset + _fnodesrecsize] = entry
        # self._dirtyoffset could be None.
        # NOTE(review): with _dirtyoffset=None, min(None, offset) is None
        # under Python 2 ordering and the ``or 0`` coerces it to 0 (full
        # rewrite) rather than ``offset`` — conservative; confirm intended.
        self._dirtyoffset = min(self._dirtyoffset, offset) or 0

    def write(self):
        """Perform all necessary writes to cache file.

        This may no-op if no writes are needed or if a write lock could
        not be obtained.
        """
        if self._dirtyoffset is None:
            return

        data = self._raw[self._dirtyoffset:]
        if not data:
            return

        repo = self._repo

        # Best effort: skip the write rather than block on the wlock.
        try:
            lock = repo.wlock(wait=False)
        except error.LockError:
            repo.ui.log('tagscache',
                        'not writing .hg/%s because lock cannot be acquired\n' %
                        (_fnodescachefile))
            return

        try:
            # 'ab' positions at EOF so tell() reports the current size.
            f = repo.vfs.open(_fnodescachefile, 'ab')
            try:
                # if the file has been truncated
                actualoffset = f.tell()
                if actualoffset < self._dirtyoffset:
                    self._dirtyoffset = actualoffset
                    data = self._raw[self._dirtyoffset:]
                f.seek(self._dirtyoffset)
                f.truncate()
                repo.ui.log('tagscache',
                            'writing %d bytes to %s\n' % (
                            len(data), _fnodescachefile))
                f.write(data)
                self._dirtyoffset = None
            finally:
                f.close()
        except (IOError, OSError) as inst:
            # Cache write failures are non-fatal; just log them.
            repo.ui.log('tagscache',
                        "couldn't write %s: %s\n" % (
                            _fnodescachefile, inst))
        finally:
            lock.release()
680 lock.release()
General Comments 0
You need to be logged in to leave comments. Login now