##// END OF EJS Templates
convert: unescape Perforce-escaped special characters in filenames
Eugene Baranov -
r25788:a36fd099 default
parent child Browse files
Show More
@@ -1,270 +1,284 b''
1 # Perforce source for convert extension.
1 # Perforce source for convert extension.
2 #
2 #
3 # Copyright 2009, Frank Kingswood <frank@kingswood-consulting.co.uk>
3 # Copyright 2009, Frank Kingswood <frank@kingswood-consulting.co.uk>
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7
7
8 from mercurial import util
8 from mercurial import util
9 from mercurial.i18n import _
9 from mercurial.i18n import _
10
10
11 from common import commit, converter_source, checktool, NoRepo
11 from common import commit, converter_source, checktool, NoRepo
12 import marshal
12 import marshal
13 import re
13 import re
14
14
def loaditer(f):
    """Yield the dictionary objects generated by p4.

    Repeatedly unmarshals objects from the file-like object ``f`` and
    yields each one. Iteration stops at the first falsy object (for
    example an empty dict) or when ``marshal.load`` raises ``EOFError``
    because the stream is exhausted.
    """
    try:
        while True:
            d = marshal.load(f)
            if not d:
                break
            yield d
    except EOFError:
        # end of the p4 output stream: simply finish the generator
        pass
25
25
def decodefilename(filename):
    """Perforce escapes special characters @, #, *, or %
    with %40, %23, %2A, or %25 respectively

    Return ``filename`` with each of those four escape sequences replaced
    by the character it stands for. Any other ``%XX`` sequence is left
    untouched, and the result is not decoded a second time.

    >>> decodefilename('portable-net45%252Bnetcore45%252Bwp8%252BMonoAndroid')
    'portable-net45%2Bnetcore45%2Bwp8%2BMonoAndroid'
    >>> decodefilename('//Depot/Directory/%2525/%2523/%23%40.%2A')
    '//Depot/Directory/%25/%23/#@.*'
    """
    # '%25' is handled last so that the '%' it produces cannot combine with
    # the following characters and be decoded again by an earlier rule.
    replacements = [('%2A', '*'), ('%23', '#'), ('%40', '@'), ('%25', '%')]
    for k, v in replacements:
        filename = filename.replace(k, v)
    return filename
39
class p4_source(converter_source):
    """Convert source that reads history through the ``p4`` command line.

    All changelists are collected up front by ``_parse`` (called from
    ``__init__``); the getter methods then answer from the dictionaries
    filled in at that point, except ``getfile`` which runs ``p4 print``.
    """

    def __init__(self, ui, path, revs=None):
        """Validate ``path``, set up state and read all changelists.

        Raises NoRepo when ``path`` contains a "/" but does not start with
        "//", and util.Abort when more than one revision is given.
        """
        super(p4_source, self).__init__(ui, path, revs=revs)

        if "/" in path and not path.startswith('//'):
            raise NoRepo(_('%s does not look like a P4 repository') % path)

        checktool('p4', abort=False)

        self.p4changes = {}
        self.heads = {}
        self.changeset = {}
        self.files = {}
        self.copies = {}
        self.tags = {}
        self.lastbranch = {}
        self.parent = {}
        self.encoding = "latin_1"
        self.depotname = {}   # mapping from local name to depot name
        self.localname = {} # mapping from depot name to local name
        # p4 file type: optional modifier prefix, base type, optional
        # "+flags" suffix
        self.re_type = re.compile(
            "([a-z]+)?(text|binary|symlink|apple|resource|unicode|utf\d+)"
            "(\+\w+)?$")
        # expanded keywords; getfile() collapses them back to "$Name$"
        self.re_keywords = re.compile(
            r"\$(Id|Header|Date|DateTime|Change|File|Revision|Author)"
            r":[^$\n]*\$")
        self.re_keywords_old = re.compile("\$(Id|Header):[^$\n]*\$")

        if revs and len(revs) > 1:
            raise util.Abort(_("p4 source does not support specifying "
                               "multiple revisions"))
        self._parse(ui, path)

    def _parse_view(self, path):
        "Read changes affecting the path"
        cmd = 'p4 -G changes -s submitted %s' % util.shellquote(path)
        stdout = util.popen(cmd, mode='rb')
        for d in loaditer(stdout):
            c = d.get("change", None)
            if c:
                # used as a set: only the keys matter
                self.p4changes[c] = True

    def _parse(self, ui, path):
        "Prepare list of P4 filenames and revisions to import"
        ui.status(_('reading p4 views\n'))

        # read client spec or view
        if "/" in path:
            self._parse_view(path)
            if path.startswith("//") and path.endswith("/..."):
                views = {path[:-3]:""}
            else:
                views = {"//": ""}
        else:
            cmd = 'p4 -G client -o %s' % util.shellquote(path)
            clientspec = marshal.load(util.popen(cmd, mode='rb'))

            views = {}
            for client in clientspec:
                if client.startswith("View"):
                    sview, cview = clientspec[client].split()
                    self._parse_view(sview)
                    if sview.endswith("...") and cview.endswith("..."):
                        sview = sview[:-3]
                        cview = cview[:-3]
                    # drop the leading "//" and the first path component
                    # of the client side of the mapping
                    cview = cview[2:]
                    cview = cview[cview.find("/") + 1:]
                    views[sview] = cview

        # list of changes that affect our source files
        self.p4changes = self.p4changes.keys()
        self.p4changes.sort(key=int)

        # list with depot pathnames, longest first
        vieworder = views.keys()
        vieworder.sort(key=len, reverse=True)

        # handle revision limiting
        startrev = self.ui.config('convert', 'p4.startrev', default=0)
        self.p4changes = [x for x in self.p4changes
                          if ((not startrev or int(x) >= int(startrev)) and
                              (not self.revs or int(x) <= int(self.revs[0])))]

        # now read the full changelists to get the list of file revisions
        ui.status(_('collecting p4 changelists\n'))
        lastid = None
        for change in self.p4changes:
            cmd = "p4 -G describe -s %s" % change
            stdout = util.popen(cmd, mode='rb')
            d = marshal.load(stdout)
            desc = self.recode(d.get("desc", ""))
            shortdesc = desc.split("\n", 1)[0]
            t = '%s %s' % (d["change"], repr(shortdesc)[1:-1])
            ui.status(util.ellipsis(t, 80) + '\n')

            # history is linear: each change has the previous one as parent
            if lastid:
                parents = [lastid]
            else:
                parents = []

            date = (int(d["time"]), 0)     # timezone not set
            c = commit(author=self.recode(d["user"]),
                       date=util.datestr(date, '%Y-%m-%d %H:%M:%S %1%2'),
                       parents=parents, desc=desc, branch='',
                       extra={"p4": change})

            files = []
            copies = {}
            copiedfiles = []
            i = 0
            while ("depotFile%d" % i) in d and ("rev%d" % i) in d:
                oldname = d["depotFile%d" % i]
                filename = None
                for v in vieworder:
                    if oldname.lower().startswith(v.lower()):
                        # local names are unescaped; depotname keeps the
                        # escaped depot path for later p4 commands
                        filename = decodefilename(views[v] + oldname[len(v):])
                        break
                if filename:
                    files.append((filename, d["rev%d" % i]))
                    self.depotname[filename] = oldname
                    if (d.get("action%d" % i) == "move/add"):
                        copiedfiles.append(filename)
                    self.localname[oldname] = filename
                i += 1

            # Collect information about copied files
            for filename in copiedfiles:
                oldname = self.depotname[filename]

                flcmd = 'p4 -G filelog %s' \
                      % util.shellquote(oldname)
                flstdout = util.popen(flcmd, mode='rb')

                copiedfilename = None
                for d in loaditer(flstdout):
                    copiedoldname = None

                    # look for the "moved from" entry recorded for this
                    # change in the file's log
                    i = 0
                    while ("change%d" % i) in d:
                        if (d["change%d" % i] == change and
                            d["action%d" % i] == "move/add"):
                            j = 0
                            while ("file%d,%d" % (i, j)) in d:
                                if d["how%d,%d" % (i, j)] == "moved from":
                                    copiedoldname = d["file%d,%d" % (i, j)]
                                    break
                                j += 1
                        i += 1

                    if copiedoldname and copiedoldname in self.localname:
                        copiedfilename = self.localname[copiedoldname]
                        break

                if copiedfilename:
                    copies[filename] = copiedfilename
                else:
                    ui.warn(_("cannot find source for copied file: %s@%s\n")
                            % (filename, change))

            self.changeset[change] = c
            self.files[change] = files
            self.copies[change] = copies
            lastid = change

        if lastid:
            self.heads = [lastid]

    def getheads(self):
        """Return the heads recorded by ``_parse`` (the last changelist)."""
        return self.heads

    def getfile(self, name, rev):
        """Return ``(contents, mode)`` for revision ``rev`` of file ``name``.

        Runs ``p4 print`` on the depot path recorded for ``name``. Returns
        ``(None, None)`` when the revision is a deletion/purge or no usable
        file type was reported. ``mode`` is "", "x" or "l". A first p4 error
        triggers one retry; a second one raises IOError.
        """
        cmd = 'p4 -G print %s' \
            % util.shellquote("%s#%s" % (self.depotname[name], rev))

        lasterror = None
        while True:
            stdout = util.popen(cmd, mode='rb')

            mode = None
            contents = ""
            keywords = None

            for d in loaditer(stdout):
                code = d["code"]
                data = d.get("data")

                if code == "error":
                    # if this is the first time error happened
                    # re-attempt getting the file
                    if not lasterror:
                        lasterror = IOError(d["generic"], data)
                        # this will exit inner-most for-loop
                        break
                    else:
                        raise lasterror

                elif code == "stat":
                    action = d.get("action")
                    if action in ["purge", "delete", "move/delete"]:
                        return None, None
                    p4type = self.re_type.match(d["type"])
                    if p4type:
                        mode = ""
                        flags = ((p4type.group(1) or "")
                               + (p4type.group(3) or ""))
                        if "x" in flags:
                            mode = "x"
                        if p4type.group(2) == "symlink":
                            mode = "l"
                        if "ko" in flags:
                            keywords = self.re_keywords_old
                        elif "k" in flags:
                            keywords = self.re_keywords

                elif code == "text" or code == "binary":
                    contents += data

                # a record was processed without error: forget any
                # earlier failure
                lasterror = None

            if not lasterror:
                break

        if mode is None:
            return None, None

        if keywords:
            # collapse expanded keywords back to their bare "$Name$" form
            contents = keywords.sub("$\\1$", contents)
        if mode == "l" and contents.endswith("\n"):
            contents = contents[:-1]

        return contents, mode

    def getchanges(self, rev, full):
        """Return ``(files, copies, set())`` for changelist ``rev``.

        Raises util.Abort when ``full`` is requested.
        """
        if full:
            raise util.Abort(_("convert from p4 do not support --full"))
        return self.files[rev], self.copies[rev], set()

    def getcommit(self, rev):
        """Return the commit object built for changelist ``rev``."""
        return self.changeset[rev]

    def gettags(self):
        """Return the tags mapping (never filled in by this class)."""
        return self.tags

    def getchangedfiles(self, rev, i):
        """Return the sorted local file names touched by ``rev``."""
        return sorted([x[0] for x in self.files[rev]])
@@ -1,37 +1,38 b''
# this is a hack to make sure no escape characters are inserted into the output
import os
import sys
if 'TERM' in os.environ:
    del os.environ['TERM']
import doctest
6
6
7 def testmod(name, optionflags=0, testtarget=None):
7 def testmod(name, optionflags=0, testtarget=None):
8 __import__(name)
8 __import__(name)
9 mod = sys.modules[name]
9 mod = sys.modules[name]
10 if testtarget is not None:
10 if testtarget is not None:
11 mod = getattr(mod, testtarget)
11 mod = getattr(mod, testtarget)
12 doctest.testmod(mod, optionflags=optionflags)
12 doctest.testmod(mod, optionflags=optionflags)
13
13
# modules whose doctests are run by this test
testmod('mercurial.changelog')
testmod('mercurial.dagparser', optionflags=doctest.NORMALIZE_WHITESPACE)
testmod('mercurial.dispatch')
testmod('mercurial.encoding')
testmod('mercurial.hg')
testmod('mercurial.hgweb.hgwebdir_mod')
testmod('mercurial.match')
testmod('mercurial.minirst')
testmod('mercurial.patch')
testmod('mercurial.pathutil')
testmod('mercurial.parser')
testmod('mercurial.revset')
testmod('mercurial.store')
testmod('mercurial.subrepo')
testmod('mercurial.templatefilters')
testmod('mercurial.templater')
testmod('mercurial.ui')
testmod('mercurial.url')
testmod('mercurial.util')
testmod('mercurial.util', testtarget='platform')
testmod('hgext.convert.cvsps')
testmod('hgext.convert.filemap')
testmod('hgext.convert.p4')
testmod('hgext.convert.subversion')
testmod('hgext.mq')
General Comments 0
You need to be logged in to leave comments. Login now