httprepo.py
454 lines
| 15.9 KiB
| text/x-python
|
PythonLexer
/ mercurial / httprepo.py
mpm@selenic.com
|
r1089 | # httprepo.py - HTTP repository proxy classes for mercurial | ||
# | ||||
Vadim Gelfer
|
r2859 | # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com> | ||
# Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com> | ||||
mpm@selenic.com
|
r1089 | # | ||
# This software may be used and distributed according to the terms | ||||
# of the GNU General Public License, incorporated herein by reference. | ||||
from node import * | ||||
from remoterepo import * | ||||
Matt Mackall
|
r3891 | from i18n import _ | ||
Matt Mackall
|
r3877 | import hg, os, urllib, urllib2, urlparse, zlib, util, httplib | ||
import errno, keepalive, tempfile, socket, changegroup | ||||
mpm@selenic.com
|
r1089 | |||
Vadim Gelfer
|
r2447 | class passwordmgr(urllib2.HTTPPasswordMgrWithDefaultRealm): | ||
Vadim Gelfer
|
r2281 | def __init__(self, ui): | ||
Vadim Gelfer
|
r2447 | urllib2.HTTPPasswordMgrWithDefaultRealm.__init__(self) | ||
Vadim Gelfer
|
r2281 | self.ui = ui | ||
def find_user_password(self, realm, authuri): | ||||
Vadim Gelfer
|
r2447 | authinfo = urllib2.HTTPPasswordMgrWithDefaultRealm.find_user_password( | ||
Vadim Gelfer
|
r2281 | self, realm, authuri) | ||
Alexis S. L. Carvalho
|
r2556 | user, passwd = authinfo | ||
if user and passwd: | ||||
return (user, passwd) | ||||
Vadim Gelfer
|
r2281 | |||
Vadim Gelfer
|
r2446 | if not self.ui.interactive: | ||
Vadim Gelfer
|
r2337 | raise util.Abort(_('http authorization required')) | ||
Vadim Gelfer
|
r2281 | self.ui.write(_("http authorization required\n")) | ||
self.ui.status(_("realm: %s\n") % realm) | ||||
Alexis S. L. Carvalho
|
r2556 | if user: | ||
self.ui.status(_("user: %s\n") % user) | ||||
else: | ||||
user = self.ui.prompt(_("user:"), default=None) | ||||
if not passwd: | ||||
passwd = self.ui.getpass() | ||||
Vadim Gelfer
|
r2281 | |||
self.add_password(realm, authuri, user, passwd) | ||||
return (user, passwd) | ||||
Vadim Gelfer
|
r2337 | def netlocsplit(netloc): | ||
'''split [user[:passwd]@]host[:port] into 4-tuple.''' | ||||
a = netloc.find('@') | ||||
if a == -1: | ||||
user, passwd = None, None | ||||
else: | ||||
userpass, netloc = netloc[:a], netloc[a+1:] | ||||
c = userpass.find(':') | ||||
if c == -1: | ||||
user, passwd = urllib.unquote(userpass), None | ||||
else: | ||||
user = urllib.unquote(userpass[:c]) | ||||
passwd = urllib.unquote(userpass[c+1:]) | ||||
c = netloc.find(':') | ||||
if c == -1: | ||||
host, port = netloc, None | ||||
else: | ||||
host, port = netloc[:c], netloc[c+1:] | ||||
return host, port, user, passwd | ||||
def netlocunsplit(host, port, user=None, passwd=None): | ||||
'''turn host, port, user, passwd into [user[:passwd]@]host[:port].''' | ||||
if port: | ||||
hostport = host + ':' + port | ||||
else: | ||||
hostport = host | ||||
if user: | ||||
if passwd: | ||||
userpass = urllib.quote(user) + ':' + urllib.quote(passwd) | ||||
else: | ||||
userpass = urllib.quote(user) | ||||
return userpass + '@' + hostport | ||||
return hostport | ||||
Alexis S. L. Carvalho
|
r4226 | # work around a bug in Python < 2.4.2 | ||
# (it leaves a "\n" at the end of Proxy-authorization headers) | ||||
class request(urllib2.Request): | ||||
def add_header(self, key, val): | ||||
if key.lower() == 'proxy-authorization': | ||||
val = val.strip() | ||||
return urllib2.Request.add_header(self, key, val) | ||||
Benoit Boissinot
|
r4025 | class httpsendfile(file): | ||
def __len__(self): | ||||
return os.fstat(self.fileno()).st_size | ||||
Vadim Gelfer
|
r2465 | |||
Benoit Boissinot
|
r4025 | def _gen_sendfile(connection): | ||
def _sendfile(self, data): | ||||
# send a file | ||||
if isinstance(data, httpsendfile): | ||||
Vadim Gelfer
|
r2465 | # if auth required, some data sent twice, so rewind here | ||
data.seek(0) | ||||
for chunk in util.filechunkiter(data): | ||||
Benoit Boissinot
|
r4025 | connection.send(self, chunk) | ||
else: | ||||
connection.send(self, data) | ||||
return _sendfile | ||||
class httpconnection(keepalive.HTTPConnection): | ||||
# must be able to send big bundle as stream. | ||||
send = _gen_sendfile(keepalive.HTTPConnection) | ||||
Vadim Gelfer
|
r2465 | |||
Alexis S. L. Carvalho
|
r2569 | class basehttphandler(keepalive.HTTPHandler): | ||
Vadim Gelfer
|
r2465 | def http_open(self, req): | ||
return self.do_open(httpconnection, req) | ||||
Alexis S. L. Carvalho
|
r2569 | has_https = hasattr(urllib2, 'HTTPSHandler') | ||
if has_https: | ||||
class httpsconnection(httplib.HTTPSConnection): | ||||
response_class = keepalive.HTTPResponse | ||||
# must be able to send big bundle as stream. | ||||
Benoit Boissinot
|
r4025 | send = _gen_sendfile(httplib.HTTPSConnection) | ||
Alexis S. L. Carvalho
|
r2557 | |||
Alexis S. L. Carvalho
|
r2569 | class httphandler(basehttphandler, urllib2.HTTPSHandler): | ||
def https_open(self, req): | ||||
return self.do_open(httpsconnection, req) | ||||
else: | ||||
class httphandler(basehttphandler): | ||||
pass | ||||
Alexis S. L. Carvalho
|
r2557 | |||
Alexis S. L. Carvalho
|
r4678 | # In python < 2.5 AbstractDigestAuthHandler raises a ValueError if | ||
# it doesn't know about the auth type requested. This can happen if | ||||
# somebody is using BasicAuth and types a bad password. | ||||
class httpdigestauthhandler(urllib2.HTTPDigestAuthHandler): | ||||
def http_error_auth_reqed(self, auth_header, host, req, headers): | ||||
try: | ||||
return urllib2.HTTPDigestAuthHandler.http_error_auth_reqed( | ||||
self, auth_header, host, req, headers) | ||||
except ValueError, inst: | ||||
arg = inst.args[0] | ||||
if arg.startswith("AbstractDigestAuthHandler doesn't know "): | ||||
return | ||||
raise | ||||
Matt Mackall
|
r3661 | def zgenerator(f): | ||
zd = zlib.decompressobj() | ||||
try: | ||||
for chunk in util.filechunkiter(f): | ||||
yield zd.decompress(chunk) | ||||
except httplib.HTTPException, inst: | ||||
raise IOError(None, _('connection ended unexpectedly')) | ||||
yield zd.flush() | ||||
Alexis S. L. Carvalho
|
r5066 | _safe = ('abcdefghijklmnopqrstuvwxyz' | ||
'ABCDEFGHIJKLMNOPQRSTUVWXYZ' | ||||
'0123456789' '_.-/') | ||||
_safeset = None | ||||
_hex = None | ||||
def quotepath(path): | ||||
'''quote the path part of a URL | ||||
This is similar to urllib.quote, but it also tries to avoid | ||||
quoting things twice (inspired by wget): | ||||
>>> quotepath('abc def') | ||||
'abc%20def' | ||||
>>> quotepath('abc%20def') | ||||
'abc%20def' | ||||
>>> quotepath('abc%20 def') | ||||
'abc%20%20def' | ||||
>>> quotepath('abc def%20') | ||||
'abc%20def%20' | ||||
>>> quotepath('abc def%2') | ||||
'abc%20def%252' | ||||
>>> quotepath('abc def%') | ||||
'abc%20def%25' | ||||
''' | ||||
global _safeset, _hex | ||||
if _safeset is None: | ||||
_safeset = util.set(_safe) | ||||
_hex = util.set('abcdefABCDEF0123456789') | ||||
l = list(path) | ||||
for i in xrange(len(l)): | ||||
c = l[i] | ||||
if c == '%' and i + 2 < len(l) and (l[i+1] in _hex and l[i+2] in _hex): | ||||
pass | ||||
elif c not in _safeset: | ||||
l[i] = '%%%02X' % ord(c) | ||||
return ''.join(l) | ||||
mpm@selenic.com
|
r1089 | class httprepository(remoterepository): | ||
def __init__(self, ui, path): | ||||
Vadim Gelfer
|
r2673 | self.path = path | ||
Vadim Gelfer
|
r2442 | self.caps = None | ||
Andrei Vermel
|
r4132 | self.handler = None | ||
Vadim Gelfer
|
r2337 | scheme, netloc, urlpath, query, frag = urlparse.urlsplit(path) | ||
if query or frag: | ||||
raise util.Abort(_('unsupported URL component: "%s"') % | ||||
(query or frag)) | ||||
Alexis S. L. Carvalho
|
r5066 | if not urlpath: | ||
urlpath = '/' | ||||
urlpath = quotepath(urlpath) | ||||
Vadim Gelfer
|
r2337 | host, port, user, passwd = netlocsplit(netloc) | ||
# urllib cannot handle URLs with embedded user or passwd | ||||
Vadim Gelfer
|
r2673 | self._url = urlparse.urlunsplit((scheme, netlocunsplit(host, port), | ||
urlpath, '', '')) | ||||
mpm@selenic.com
|
r1089 | self.ui = ui | ||
Alexis S. L. Carvalho
|
r5066 | self.ui.debug(_('using %s\n') % self._url) | ||
Vadim Gelfer
|
r2337 | |||
proxyurl = ui.config("http_proxy", "host") or os.getenv('http_proxy') | ||||
Benoit Boissinot
|
r3131 | # XXX proxyauthinfo = None | ||
Andrei Vermel
|
r4132 | self.handler = httphandler() | ||
handlers = [self.handler] | ||||
Vadim Gelfer
|
r2337 | |||
if proxyurl: | ||||
# proxy can be proper url or host[:port] | ||||
if not (proxyurl.startswith('http:') or | ||||
proxyurl.startswith('https:')): | ||||
proxyurl = 'http://' + proxyurl + '/' | ||||
snpqf = urlparse.urlsplit(proxyurl) | ||||
proxyscheme, proxynetloc, proxypath, proxyquery, proxyfrag = snpqf | ||||
hpup = netlocsplit(proxynetloc) | ||||
proxyhost, proxyport, proxyuser, proxypasswd = hpup | ||||
if not proxyuser: | ||||
proxyuser = ui.config("http_proxy", "user") | ||||
proxypasswd = ui.config("http_proxy", "passwd") | ||||
mpm@selenic.com
|
r1089 | |||
Vadim Gelfer
|
r2337 | # see if we should use a proxy for this url | ||
no_list = [ "localhost", "127.0.0.1" ] | ||||
Thomas Arendsen Hein
|
r2501 | no_list.extend([p.lower() for | ||
p in ui.configlist("http_proxy", "no")]) | ||||
Vadim Gelfer
|
r2337 | no_list.extend([p.strip().lower() for | ||
p in os.getenv("no_proxy", '').split(',') | ||||
if p.strip()]) | ||||
# "http_proxy.always" config is for running tests on localhost | ||||
if (not ui.configbool("http_proxy", "always") and | ||||
host.lower() in no_list): | ||||
ui.debug(_('disabling proxy for %s\n') % host) | ||||
else: | ||||
proxyurl = urlparse.urlunsplit(( | ||||
proxyscheme, netlocunsplit(proxyhost, proxyport, | ||||
proxyuser, proxypasswd or ''), | ||||
proxypath, proxyquery, proxyfrag)) | ||||
Alexis S. L. Carvalho
|
r3608 | handlers.append(urllib2.ProxyHandler({scheme: proxyurl})) | ||
Thomas Arendsen Hein
|
r3223 | ui.debug(_('proxying through http://%s:%s\n') % | ||
TK Soh
|
r3170 | (proxyhost, proxyport)) | ||
mpm@selenic.com
|
r1089 | |||
Vadim Gelfer
|
r2337 | # urllib2 takes proxy values from the environment and those | ||
# will take precedence if found, so drop them | ||||
mpm@selenic.com
|
r1089 | for env in ["HTTP_PROXY", "http_proxy", "no_proxy"]: | ||
try: | ||||
if os.environ.has_key(env): | ||||
del os.environ[env] | ||||
except OSError: | ||||
pass | ||||
Vadim Gelfer
|
r2337 | passmgr = passwordmgr(ui) | ||
if user: | ||||
Alexis S. L. Carvalho
|
r2556 | ui.debug(_('http auth: user %s, password %s\n') % | ||
(user, passwd and '*' * len(passwd) or 'not set')) | ||||
Vadim Gelfer
|
r2337 | passmgr.add_password(None, host, user, passwd or '') | ||
mpm@selenic.com
|
r1089 | |||
Alexis S. L. Carvalho
|
r3608 | handlers.extend((urllib2.HTTPBasicAuthHandler(passmgr), | ||
Alexis S. L. Carvalho
|
r4678 | httpdigestauthhandler(passmgr))) | ||
Alexis S. L. Carvalho
|
r3608 | opener = urllib2.build_opener(*handlers) | ||
Vadim Gelfer
|
r2281 | |||
Matt Mackall
|
r1359 | # 1.0 here is the _protocol_ version | ||
opener.addheaders = [('User-agent', 'mercurial/proto-1.0')] | ||||
mpm@selenic.com
|
r1089 | urllib2.install_opener(opener) | ||
Thomas Arendsen Hein
|
r4516 | |||
Andrei Vermel
|
r4132 | def __del__(self): | ||
if self.handler: | ||||
self.handler.close_all() | ||||
self.handler = None | ||||
mpm@selenic.com
|
r1089 | |||
Vadim Gelfer
|
r2673 | def url(self): | ||
return self.path | ||||
Vadim Gelfer
|
r2442 | # look up capabilities only when needed | ||
def get_caps(self): | ||||
if self.caps is None: | ||||
try: | ||||
self.caps = self.do_read('capabilities').split() | ||||
except hg.RepoError: | ||||
self.caps = () | ||||
Vadim Gelfer
|
r2465 | self.ui.debug(_('capabilities: %s\n') % | ||
(' '.join(self.caps or ['none']))) | ||||
Vadim Gelfer
|
r2442 | return self.caps | ||
capabilities = property(get_caps) | ||||
Vadim Gelfer
|
r1870 | def lock(self): | ||
raise util.Abort(_('operation not supported over http')) | ||||
mpm@selenic.com
|
r1089 | def do_cmd(self, cmd, **args): | ||
Vadim Gelfer
|
r2465 | data = args.pop('data', None) | ||
headers = args.pop('headers', {}) | ||||
Benoit Boissinot
|
r1402 | self.ui.debug(_("sending %s command\n") % cmd) | ||
mpm@selenic.com
|
r1089 | q = {"cmd": cmd} | ||
q.update(args) | ||||
Benoit Boissinot
|
r3562 | qs = '?%s' % urllib.urlencode(q) | ||
cu = "%s%s" % (self._url, qs) | ||||
Thomas Arendsen Hein
|
r2294 | try: | ||
Thomas Arendsen Hein
|
r3567 | if data: | ||
Alexis S. L. Carvalho
|
r3608 | self.ui.debug(_("sending %s bytes\n") % | ||
headers.get('content-length', 'X')) | ||||
Alexis S. L. Carvalho
|
r4226 | resp = urllib2.urlopen(request(cu, data, headers)) | ||
Vadim Gelfer
|
r2467 | except urllib2.HTTPError, inst: | ||
if inst.code == 401: | ||||
raise util.Abort(_('authorization failed')) | ||||
raise | ||||
Thomas Arendsen Hein
|
r2294 | except httplib.HTTPException, inst: | ||
Vadim Gelfer
|
r2336 | self.ui.debug(_('http error while sending %s command\n') % cmd) | ||
self.ui.print_exc() | ||||
raise IOError(None, inst) | ||||
Thomas Arendsen Hein
|
r3399 | except IndexError: | ||
# this only happens with Python 2.3, later versions raise URLError | ||||
raise util.Abort(_('http error, possibly caused by proxy setting')) | ||||
Benoit Boissinot
|
r3562 | # record the url we got redirected to | ||
Thomas Arendsen Hein
|
r3570 | resp_url = resp.geturl() | ||
if resp_url.endswith(qs): | ||||
resp_url = resp_url[:-len(qs)] | ||||
if self._url != resp_url: | ||||
self.ui.status(_('real URL is %s\n') % resp_url) | ||||
self._url = resp_url | ||||
Vadim Gelfer
|
r2435 | try: | ||
proto = resp.getheader('content-type') | ||||
except AttributeError: | ||||
proto = resp.headers['content-type'] | ||||
mpm@selenic.com
|
r1089 | |||
# accept old "text/plain" and "application/hg-changegroup" for now | ||||
Thomas Arendsen Hein
|
r4633 | if not (proto.startswith('application/mercurial-') or | ||
proto.startswith('text/plain') or | ||||
proto.startswith('application/hg-changegroup')): | ||||
Thomas Arendsen Hein
|
r4739 | self.ui.debug(_("Requested URL: '%s'\n") % cu) | ||
Thomas Arendsen Hein
|
r4633 | raise hg.RepoError(_("'%s' does not appear to be an hg repository") | ||
% self._url) | ||||
mpm@selenic.com
|
r1089 | |||
Benoit Boissinot
|
r4012 | if proto.startswith('application/mercurial-'): | ||
try: | ||||
Thomas Arendsen Hein
|
r4356 | version = proto.split('-', 1)[1] | ||
version_info = tuple([int(n) for n in version.split('.')]) | ||||
Benoit Boissinot
|
r4012 | except ValueError: | ||
raise hg.RepoError(_("'%s' sent a broken Content-type " | ||||
"header (%s)") % (self._url, proto)) | ||||
Thomas Arendsen Hein
|
r4356 | if version_info > (0, 1): | ||
Benoit Boissinot
|
r1402 | raise hg.RepoError(_("'%s' uses newer protocol %s") % | ||
Vadim Gelfer
|
r2673 | (self._url, version)) | ||
mpm@selenic.com
|
r1089 | |||
return resp | ||||
Vadim Gelfer
|
r2435 | def do_read(self, cmd, **args): | ||
fp = self.do_cmd(cmd, **args) | ||||
try: | ||||
return fp.read() | ||||
finally: | ||||
# if using keepalive, allow connection to be reused | ||||
fp.close() | ||||
Eric Hopper
|
r3444 | def lookup(self, key): | ||
Matt Mackall
|
r3445 | d = self.do_cmd("lookup", key = key).read() | ||
success, data = d[:-1].split(' ', 1) | ||||
if int(success): | ||||
return bin(data) | ||||
raise hg.RepoError(data) | ||||
Eric Hopper
|
r3444 | |||
mpm@selenic.com
|
r1089 | def heads(self): | ||
Vadim Gelfer
|
r2435 | d = self.do_read("heads") | ||
mpm@selenic.com
|
r1089 | try: | ||
return map(bin, d[:-1].split(" ")) | ||||
except: | ||||
Thomas Arendsen Hein
|
r3565 | raise util.UnexpectedOutput(_("unexpected response:"), d) | ||
mpm@selenic.com
|
r1089 | |||
def branches(self, nodes): | ||||
n = " ".join(map(hex, nodes)) | ||||
Vadim Gelfer
|
r2435 | d = self.do_read("branches", nodes=n) | ||
mpm@selenic.com
|
r1089 | try: | ||
br = [ tuple(map(bin, b.split(" "))) for b in d.splitlines() ] | ||||
return br | ||||
except: | ||||
Thomas Arendsen Hein
|
r3565 | raise util.UnexpectedOutput(_("unexpected response:"), d) | ||
mpm@selenic.com
|
r1089 | |||
def between(self, pairs): | ||||
n = "\n".join(["-".join(map(hex, p)) for p in pairs]) | ||||
Vadim Gelfer
|
r2435 | d = self.do_read("between", pairs=n) | ||
mpm@selenic.com
|
r1089 | try: | ||
p = [ l and map(bin, l.split(" ")) or [] for l in d.splitlines() ] | ||||
return p | ||||
except: | ||||
Thomas Arendsen Hein
|
r3565 | raise util.UnexpectedOutput(_("unexpected response:"), d) | ||
mpm@selenic.com
|
r1089 | |||
Vadim Gelfer
|
r1736 | def changegroup(self, nodes, kind): | ||
mpm@selenic.com
|
r1089 | n = " ".join(map(hex, nodes)) | ||
f = self.do_cmd("changegroup", roots=n) | ||||
Matt Mackall
|
r3661 | return util.chunkbuffer(zgenerator(f)) | ||
Eric Hopper
|
r3444 | |||
def changegroupsubset(self, bases, heads, source): | ||||
baselst = " ".join([hex(n) for n in bases]) | ||||
headlst = " ".join([hex(n) for n in heads]) | ||||
f = self.do_cmd("changegroupsubset", bases=baselst, heads=headlst) | ||||
Matt Mackall
|
r3661 | return util.chunkbuffer(zgenerator(f)) | ||
mpm@selenic.com
|
r1089 | |||
Vadim Gelfer
|
r2439 | def unbundle(self, cg, heads, source): | ||
Vadim Gelfer
|
r2465 | # have to stream bundle to a temp file because we do not have | ||
# http 1.1 chunked transfer. | ||||
Matt Mackall
|
r3662 | type = "" | ||
types = self.capable('unbundle') | ||||
Alexis S. L. Carvalho
|
r3703 | # servers older than d1b16a746db6 will send 'unbundle' as a | ||
# boolean capability | ||||
try: | ||||
types = types.split(',') | ||||
except AttributeError: | ||||
types = [""] | ||||
Matt Mackall
|
r3662 | if types: | ||
Alexis S. L. Carvalho
|
r3703 | for x in types: | ||
Matt Mackall
|
r3662 | if x in changegroup.bundletypes: | ||
type = x | ||||
break | ||||
Thomas Arendsen Hein
|
r3613 | |||
Matt Mackall
|
r3662 | tempname = changegroup.writebundle(cg, None, type) | ||
Benoit Boissinot
|
r4025 | fp = httpsendfile(tempname, "rb") | ||
Vadim Gelfer
|
r2465 | try: | ||
try: | ||||
Vadim Gelfer
|
r2467 | rfp = self.do_cmd( | ||
'unbundle', data=fp, | ||||
Benoit Boissinot
|
r4025 | headers={'content-type': 'application/octet-stream'}, | ||
Vadim Gelfer
|
r2467 | heads=' '.join(map(hex, heads))) | ||
try: | ||||
ret = int(rfp.readline()) | ||||
self.ui.write(rfp.read()) | ||||
return ret | ||||
finally: | ||||
rfp.close() | ||||
except socket.error, err: | ||||
if err[0] in (errno.ECONNRESET, errno.EPIPE): | ||||
Thomas Arendsen Hein
|
r3072 | raise util.Abort(_('push failed: %s') % err[1]) | ||
Vadim Gelfer
|
r2467 | raise util.Abort(err[1]) | ||
Vadim Gelfer
|
r2465 | finally: | ||
fp.close() | ||||
os.unlink(tempname) | ||||
Vadim Gelfer
|
r2439 | |||
Vadim Gelfer
|
r2612 | def stream_out(self): | ||
return self.do_cmd('stream_out') | ||||
mpm@selenic.com
|
r1089 | class httpsrepository(httprepository): | ||
Alexis S. L. Carvalho
|
r2569 | def __init__(self, ui, path): | ||
if not has_https: | ||||
raise util.Abort(_('Python support for SSL and HTTPS ' | ||||
'is not installed')) | ||||
httprepository.__init__(self, ui, path) | ||||
Vadim Gelfer
|
r2740 | |||
def instance(ui, path, create): | ||||
if create: | ||||
raise util.Abort(_('cannot create new http repository')) | ||||
if path.startswith('https:'): | ||||
return httpsrepository(ui, path) | ||||
return httprepository(ui, path) | ||||