##// END OF EJS Templates
tags: improve documentation...
Gregory Szorc -
r24445:c71edbaf default
parent child Browse files
Show More
@@ -18,12 +18,61 import error
18 18 import errno
19 19 import time
20 20
21 # The tags cache stores information about heads and the history of tags.
22 #
23 # The cache file consists of two parts. The first part maps head nodes
24 # to .hgtags filenodes. The second part is a history of tags. The two
25 # parts are separated by an empty line.
26 #
27 # The first part consists of lines of the form:
28 #
29 # <headrev> <headnode> [<hgtagsnode>]
30 #
31 # <headrev> is an integer revision and <headnode> is a 40 character hex
32 # node for that changeset. These redundantly identify a repository
33 # head from the time the cache was written.
34 #
35 # <tagnode> is the filenode of .hgtags on that head. Heads with no .hgtags
36 # file will have no <hgtagsnode> (just 2 values per line).
37 #
38 # The filenode cache is ordered from tip to oldest (which is part of why
39 # <headrev> is there: a quick check of the tip from when the cache was
40 # written against the current tip is all that is needed to check whether
41 # the cache is up to date).
42 #
43 # The purpose of the filenode cache is to avoid the most expensive part
44 # of finding global tags, which is looking up the .hgtags filenode in the
45 # manifest for each head. This can take over a minute on repositories
46 # that have large manifests and many heads.
47 #
48 # The second part of the tags cache consists of lines of the form:
49 #
50 # <node> <tag>
51 #
52 # (This format is identical to that of .hgtags files.)
53 #
54 # <tag> is the tag name and <node> is the 40 character hex changeset
55 # the tag is associated with.
56 #
57 # Tags are written sorted by tag name.
58 #
59 # Tags associated with multiple changesets have an entry for each changeset.
60 # The most recent changeset (in terms of revlog ordering for the head
61 # setting it) for each tag is last.
62
21 63 def findglobaltags(ui, repo, alltags, tagtypes):
22 '''Find global tags in repo by reading .hgtags from every head that
23 has a distinct version of it, using a cache to avoid excess work.
24 Updates the dicts alltags, tagtypes in place: alltags maps tag name
25 to (node, hist) pair (see _readtags() below), and tagtypes maps tag
26 name to tag type ("global" in this case).'''
64 '''Find global tags in a repo.
65
66 "alltags" maps tag name to (node, hist) 2-tuples.
67
68 "tagtypes" maps tag name to tag type. Global tags always have the
69 "global" tag type.
70
71 The "alltags" and "tagtypes" dicts are updated in place. Empty dicts
72 should be passed in.
73
74 The tags cache is read and updated as a side-effect of calling.
75 '''
27 76 # This is so we can be lazy and assume alltags contains only global
28 77 # tags when we pass it to _writetagcache().
29 78 assert len(alltags) == len(tagtypes) == 0, \
@@ -86,14 +135,18 def readlocaltags(ui, repo, alltags, tag
86 135
87 136 def _readtaghist(ui, repo, lines, fn, recode=None, calcnodelines=False):
88 137 '''Read tag definitions from a file (or any source of lines).
138
89 139 This function returns two sortdicts with similar information:
140
90 141 - the first dict, bintaghist, contains the tag information as expected by
91 142 the _readtags function, i.e. a mapping from tag name to (node, hist):
92 143 - node is the node id from the last line read for that name,
93 144 - hist is the list of node ids previously associated with it (in file
94 145 order). All node ids are binary, not hex.
146
95 147 - the second dict, hextaglines, is a mapping from tag name to a list of
96 148 [hexnode, line number] pairs, ordered from the oldest to the newest node.
149
97 150 When calcnodelines is False the hextaglines dict is not calculated (an
98 151 empty dict is returned). This is done to improve this function's
99 152 performance in cases where the line numbers are not needed.
@@ -139,10 +192,13 def _readtaghist(ui, repo, lines, fn, re
139 192
140 193 def _readtags(ui, repo, lines, fn, recode=None, calcnodelines=False):
141 194 '''Read tag definitions from a file (or any source of lines).
142 Return a mapping from tag name to (node, hist): node is the node id
143 from the last line read for that name, and hist is the list of node
144 ids previously associated with it (in file order). All node ids are
145 binary, not hex.'''
195
196 Returns a mapping from tag name to (node, hist).
197
198 "node" is the node id from the last line read for that name. "hist"
199 is the list of node ids previously associated with it (in file order).
200 All node ids are binary, not hex.
201 '''
146 202 filetags, nodelines = _readtaghist(ui, repo, lines, fn, recode=recode,
147 203 calcnodelines=calcnodelines)
148 204 for tag, taghist in filetags.items():
@@ -174,23 +230,23 def _updatetags(filetags, tagtype, allta
174 230 ahist.extend([n for n in bhist if n not in ahist])
175 231 alltags[name] = anode, ahist
176 232
233 def _readtagcache(ui, repo):
234 '''Read the tag cache.
177 235
178 # The tag cache only stores info about heads, not the tag contents
179 # from each head. I.e. it doesn't try to squeeze out the maximum
180 # performance, but is simpler has a better chance of actually
181 # working correctly. And this gives the biggest performance win: it
182 # avoids looking up .hgtags in the manifest for every head, and it
183 # can avoid calling heads() at all if there have been no changes to
184 # the repo.
236 Returns a tuple (heads, fnodes, cachetags, shouldwrite).
237
238 If the cache is completely up-to-date, "cachetags" is a dict of the
239 form returned by _readtags() and "heads" and "fnodes" are None and
240 "shouldwrite" is False.
185 241
186 def _readtagcache(ui, repo):
187 '''Read the tag cache and return a tuple (heads, fnodes, cachetags,
188 shouldwrite). If the cache is completely up-to-date, cachetags is a
189 dict of the form returned by _readtags(); otherwise, it is None and
190 heads and fnodes are set. In that case, heads is the list of all
191 heads currently in the repository (ordered from tip to oldest) and
192 fnodes is a mapping from head to .hgtags filenode. If those two are
193 set, caller is responsible for reading tag info from each head.'''
242 If the cache is not up to date, "cachetags" is None. "heads" is a list
243 of all heads currently in the repository, ordered from tip to oldest.
244 "fnodes" is a mapping from head to .hgtags filenode. "shouldwrite" is
245 True.
246
247 If the cache is not up to date, the caller is responsible for reading tag
248 info from each returned head. (See findglobaltags().)
249 '''
194 250
195 251 try:
196 252 cachefile = repo.vfs('cache/tags', 'r')
@@ -199,18 +255,6 def _readtagcache(ui, repo):
199 255 except IOError:
200 256 cachefile = None
201 257
202 # The cache file consists of lines like
203 # <headrev> <headnode> [<tagnode>]
204 # where <headrev> and <headnode> redundantly identify a repository
205 # head from the time the cache was written, and <tagnode> is the
206 # filenode of .hgtags on that head. Heads with no .hgtags file will
207 # have no <tagnode>. The cache is ordered from tip to oldest (which
208 # is part of why <headrev> is there: a quick visual check is all
209 # that's required to ensure correct order).
210 #
211 # This information is enough to let us avoid the most expensive part
212 # of finding global tags, which is looking up <tagnode> in the
213 # manifest for each head.
214 258 cacherevs = [] # list of headrev
215 259 cacheheads = [] # list of headnode
216 260 cachefnode = {} # map headnode to filenode
@@ -301,7 +345,6 def _readtagcache(ui, repo):
301 345 return (repoheads, cachefnode, None, True)
302 346
303 347 def _writetagcache(ui, repo, heads, tagfnode, cachetags):
304
305 348 try:
306 349 cachefile = repo.vfs('cache/tags', 'w', atomictemp=True)
307 350 except (OSError, IOError):
General Comments 0
You need to be logged in to leave comments. Login now