##// END OF EJS Templates
convert: Clean up authormap key=value splitting....
Marti Raudsepp -
r6186:aae4eb2f default
parent child Browse files
Show More
@@ -1,351 +1,352 b''
1 1 # convcmd - convert extension commands definition
2 2 #
3 3 # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
4 4 #
5 5 # This software may be used and distributed according to the terms
6 6 # of the GNU General Public License, incorporated herein by reference.
7 7
8 8 from common import NoRepo, SKIPREV, converter_source, converter_sink, mapfile
9 9 from cvs import convert_cvs
10 10 from darcs import darcs_source
11 11 from git import convert_git
12 12 from hg import mercurial_source, mercurial_sink
13 13 from subversion import debugsvnlog, svn_source, svn_sink
14 14 from gnuarch import gnuarch_source
15 15 import filemap
16 16
17 17 import os, shutil
18 18 from mercurial import hg, util
19 19 from mercurial.i18n import _
20 20
# Target encoding used by recode(); convert() overwrites it with the value
# of util._encoding before forcing util._encoding to 'UTF-8'.
orig_encoding = 'ascii'
22 22
def recode(s):
    """Return s encoded in orig_encoding, replacing unencodable characters.

    Unicode objects are encoded directly; any other string is first
    decoded as UTF-8.
    """
    text = s
    if not isinstance(text, unicode):
        text = text.decode('utf-8')
    return text.encode(orig_encoding, 'replace')
28 28
# (type name, factory) pairs tried in this order by convertsource().
source_converters = [
    ('cvs', convert_cvs),
    ('git', convert_git),
    ('svn', svn_source),
    ('hg', mercurial_source),
    ('darcs', darcs_source),
    ('gnuarch', gnuarch_source),
]

# (type name, factory) pairs tried in this order by convertsink().
sink_converters = [
    ('hg', mercurial_sink),
    ('svn', svn_sink),
]
42 42
43 43 def convertsource(ui, path, type, rev):
44 44 exceptions = []
45 45 for name, source in source_converters:
46 46 try:
47 47 if not type or name == type:
48 48 return source(ui, path, rev)
49 49 except NoRepo, inst:
50 50 exceptions.append(inst)
51 51 if not ui.quiet:
52 52 for inst in exceptions:
53 53 ui.write(_("%s\n") % inst)
54 54 raise util.Abort('%s: unknown repository type' % path)
55 55
56 56 def convertsink(ui, path, type):
57 57 for name, sink in sink_converters:
58 58 try:
59 59 if not type or name == type:
60 60 return sink(ui, path)
61 61 except NoRepo, inst:
62 62 ui.note(_("convert: %s\n") % inst)
63 63 raise util.Abort('%s: unknown repository type' % path)
64 64
class converter(object):
    """Copy revisions from a source converter into a sink converter.

    The instance keeps the revision map (source revision -> converted
    revision), an author map (source author -> destination author), a
    splice map and a cache of the commits read from the source.
    """

    def __init__(self, ui, source, dest, revmapfile, opts):
        """Set up the maps used by the conversion.

        ui         -- object used for all status/debug/warning output
        source     -- source converter
        dest       -- sink converter
        revmapfile -- path handed to mapfile() for the revision map
        opts       -- option dictionary; 'authors', 'splicemap' and
                      'datesort' are read by this class
        """
        self.source = source
        self.dest = dest
        self.ui = ui
        self.opts = opts
        self.commitcache = {}
        self.authors = {}
        self.authorfile = None

        self.map = mapfile(ui, revmapfile)

        # Read first the dst author map if any
        authorfile = self.dest.authorfile()
        if authorfile and os.path.exists(authorfile):
            self.readauthormap(authorfile)
        # Extend/Override with new author map if necessary
        if opts.get('authors'):
            self.readauthormap(opts.get('authors'))
            # Only when a user map was given is the merged map written
            # back (see writeauthormap()).
            self.authorfile = self.dest.authorfile()

        self.splicemap = mapfile(ui, opts.get('splicemap'))

    def walktree(self, heads):
        '''Return a mapping that identifies the uncommitted parents of every
        uncommitted changeset.'''
        # Work on a copy so the caller's list is not emptied by pop().
        visit = list(heads)
        known = {}
        parents = {}
        while visit:
            n = visit.pop(0)
            if n in known or n in self.map:
                continue
            known[n] = 1
            commit = self.cachecommit(n)
            parents[n] = []
            for p in commit.parents:
                parents[n].append(p)
                visit.append(p)

        return parents

    def toposort(self, parents):
        '''Return an ordering such that every uncommitted changeset is
        preceded by all its uncommitted ancestors.'''
        visit = list(parents)
        seen = {}
        children = {}
        actives = []

        while visit:
            n = visit.pop(0)
            if n in seen:
                continue
            seen[n] = 1
            # Ensure that nodes without parents are present in the 'children'
            # mapping.
            children.setdefault(n, [])
            hasparent = False
            for p in parents[n]:
                if p not in self.map:
                    visit.append(p)
                    hasparent = True
                children.setdefault(p, []).append(n)
            if not hasparent:
                # No unconverted parent: eligible right away.
                actives.append(n)

        del seen
        del visit

        if self.opts.get('datesort'):
            dates = {}
            def getdate(n):
                # Parse each commit date once.
                if n not in dates:
                    dates[n] = util.parsedate(self.commitcache[n].date)
                return dates[n]

            def picknext(nodes):
                return min([(getdate(n), n) for n in nodes])[1]
        else:
            # One-element list so the nested function can rebind the value.
            prev = [None]
            def picknext(nodes):
                # Return the first eligible child of the previously converted
                # revision, or any of them.
                chosen = nodes[0]
                for n in nodes:
                    if prev[0] in parents[n]:
                        chosen = n
                        break
                prev[0] = chosen
                return chosen

        s = []
        pendings = {}
        while actives:
            n = picknext(actives)
            actives.remove(n)
            s.append(n)

            # Update dependents list
            for c in children.get(n, []):
                if c not in pendings:
                    pendings[c] = [p for p in parents[c] if p not in self.map]
                try:
                    pendings[c].remove(n)
                except ValueError:
                    raise util.Abort(_('cycle detected between %s and %s')
                                     % (recode(c), recode(n)))
                if not pendings[c]:
                    # Parents are converted, node is eligible
                    actives.insert(0, c)
                    pendings[c] = None

        if len(s) != len(parents):
            raise util.Abort(_("not all revisions were sorted"))

        return s

    def writeauthormap(self):
        """Write self.authors as 'source=destination' lines.

        Nothing is written unless self.authorfile is set.
        """
        authorfile = self.authorfile
        if authorfile:
            self.ui.status('Writing author map file %s\n' % authorfile)
            ofile = open(authorfile, 'w+')
            try:
                for author in self.authors:
                    ofile.write("%s=%s\n" % (author, self.authors[author]))
            finally:
                # Close the handle even if a write fails.
                ofile.close()

    def readauthormap(self, authorfile):
        """Merge the 'source=destination' lines of authorfile into
        self.authors.

        Blank lines are skipped.  A line is split on its first '=' only,
        so the destination may itself contain '='.  Lines without any
        '=' are reported through ui.warn() and ignored.
        """
        afile = open(authorfile, 'r')
        try:
            for line in afile:
                if line.strip() == '':
                    continue
                try:
                    srcauthor, dstauthor = line.split('=', 1)
                except ValueError:
                    # split() returned a single element: no '=' on the line.
                    self.ui.warn(
                        'Ignoring bad line in author map file %s: %s\n'
                        % (authorfile, line.rstrip()))
                    continue
                srcauthor = srcauthor.strip()
                dstauthor = dstauthor.strip()
                if (srcauthor in self.authors and
                    dstauthor != self.authors[srcauthor]):
                    self.ui.status(
                        'Overriding mapping for author %s, was %s, will be %s\n'
                        % (srcauthor, self.authors[srcauthor], dstauthor))
                else:
                    self.ui.debug('Mapping author %s to %s\n'
                                  % (srcauthor, dstauthor))
                # Stored in both cases so that an override really takes
                # effect, as the status message above announces.
                self.authors[srcauthor] = dstauthor
        finally:
            # Close the handle even if reading or reporting fails.
            afile.close()

    def cachecommit(self, rev):
        """Fetch the commit for rev from the source, apply the author map
        to it, store it in self.commitcache and return it."""
        commit = self.source.getcommit(rev)
        commit.author = self.authors.get(commit.author, commit.author)
        self.commitcache[rev] = commit
        return commit

    def copy(self, rev):
        """Convert the single revision rev and record it in self.map.

        rev must already be present in self.commitcache.
        """
        commit = self.commitcache[rev]
        do_copies = hasattr(self.dest, 'copyfile')
        filenames = []

        changes = self.source.getchanges(rev)
        if isinstance(changes, basestring):
            # A string result is either SKIPREV or another source revision
            # whose converted counterpart is reused for rev.
            if changes == SKIPREV:
                dest = SKIPREV
            else:
                dest = self.map[changes]
            self.map[rev] = dest
            return
        files, copies = changes
        pbranches = []
        if commit.parents:
            for prev in commit.parents:
                if prev not in self.commitcache:
                    self.cachecommit(prev)
                pbranches.append((self.map[prev],
                                  self.commitcache[prev].branch))
        self.dest.setbranch(commit.branch, pbranches)
        for f, v in files:
            filenames.append(f)
            try:
                data = self.source.getfile(f, v)
            except IOError:
                # The source cannot provide the file: delete it in the sink.
                self.dest.delfile(f)
            else:
                e = self.source.getmode(f, v)
                self.dest.putfile(f, e, data)
                if do_copies:
                    if f in copies:
                        copyf = copies[f]
                        # Merely marks that a copy happened.
                        self.dest.copyfile(copyf, f)

        try:
            parents = self.splicemap[rev].replace(',', ' ').split()
            self.ui.status('spliced in %s as parents of %s\n' %
                           (parents, rev))
            parents = [self.map.get(p, p) for p in parents]
        except KeyError:
            # No splice entry for rev: use the converted regular parents.
            parents = [b[0] for b in pbranches]
        newnode = self.dest.putcommit(filenames, parents, commit)
        self.source.converted(rev, newnode)
        self.map[rev] = newnode

    def convert(self):
        """Run the whole conversion: scan, sort, copy every revision,
        convert tags and write the author map.  cleanup() is always
        called at the end."""
        try:
            self.source.before()
            self.dest.before()
            self.source.setrevmap(self.map)
            self.ui.status("scanning source...\n")
            heads = self.source.getheads()
            parents = self.walktree(heads)
            self.ui.status("sorting...\n")
            t = self.toposort(parents)
            num = len(t)
            c = None

            self.ui.status("converting...\n")
            for c in t:
                num -= 1
                desc = self.commitcache[c].desc
                if "\n" in desc:
                    desc = desc.splitlines()[0]
                # convert log message to local encoding without using
                # tolocal() because util._encoding is set to 'utf-8' by
                # the convert() command
                self.ui.status("%d %s\n" % (num, recode(desc)))
                # Translate the template first, then fill it in.
                self.ui.note(_("source: %s\n") % recode(c))
                self.copy(c)

            tags = self.source.gettags()
            ctags = {}
            for k in tags:
                v = tags[k]
                if self.map.get(v, SKIPREV) != SKIPREV:
                    ctags[k] = self.map[v]

            if c and ctags:
                nrev = self.dest.puttags(ctags)
                # write another hash correspondence to override the previous
                # one so we don't end up with extra tag heads
                if nrev:
                    self.map[c] = nrev

            self.writeauthormap()
        finally:
            self.cleanup()

    def cleanup(self):
        """Call after() on the sink and then on the source (even if the
        sink's after() raised), then close the revision map."""
        try:
            self.dest.after()
        finally:
            self.source.after()
        self.map.close()
318 319
def convert(ui, src, dest=None, revmapfile=None, **opts):
    """Entry point of the convert command.

    ui         -- object used for status output
    src        -- source repository path
    dest       -- destination path; defaults to hg.defaultdest(src) + "-hg"
    revmapfile -- revision map path; defaults to the sink's revmapfile(),
                  or to "map" inside dest if that call fails
    opts       -- 'dest_type', 'source_type', 'rev' and 'filemap' are read
                  here; the whole dictionary is passed on to converter
    """
    global orig_encoding
    # Remember the current encoding for recode(), then switch to UTF-8.
    orig_encoding = util._encoding
    util._encoding = 'UTF-8'

    if not dest:
        dest = hg.defaultdest(src) + "-hg"
        ui.status("assuming destination %s\n" % dest)

    destc = convertsink(ui, dest, opts.get('dest_type'))

    try:
        srcc = convertsource(ui, src, opts.get('source_type'),
                             opts.get('rev'))
    except Exception:
        # The source could not be opened: remove every path listed in
        # the sink's 'created' attribute before re-raising.
        for path in destc.created:
            shutil.rmtree(path, True)
        raise

    fmap = opts.get('filemap')
    if fmap:
        srcc = filemap.filemap_source(ui, srcc, fmap)
        destc.setfilemapmode(True)

    if not revmapfile:
        try:
            revmapfile = destc.revmapfile()
        except Exception:
            # Fall back to a file inside the destination path.  The path
            # string must be joined here, not the sink object.
            revmapfile = os.path.join(dest, "map")

    c = converter(ui, srcc, destc, revmapfile, opts)
    c.convert()
351 352
General Comments 0
You need to be logged in to leave comments. Login now