|
|
# httprepo.py - HTTP repository proxy classes for mercurial
|
|
|
#
|
|
|
# Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
|
|
|
# Copyright 2006 Vadim Gelfer <vadim.gelfer@gmail.com>
|
|
|
#
|
|
|
# This software may be used and distributed according to the terms
|
|
|
# of the GNU General Public License, incorporated herein by reference.
|
|
|
|
|
|
from node import *
|
|
|
from remoterepo import *
|
|
|
from i18n import _
|
|
|
import repo, os, urllib, urllib2, urlparse, zlib, util, httplib
|
|
|
import errno, keepalive, tempfile, socket, changegroup
|
|
|
|
|
|
class passwordmgr(urllib2.HTTPPasswordMgrWithDefaultRealm):
|
|
|
def __init__(self, ui):
|
|
|
urllib2.HTTPPasswordMgrWithDefaultRealm.__init__(self)
|
|
|
self.ui = ui
|
|
|
|
|
|
def find_user_password(self, realm, authuri):
|
|
|
authinfo = urllib2.HTTPPasswordMgrWithDefaultRealm.find_user_password(
|
|
|
self, realm, authuri)
|
|
|
user, passwd = authinfo
|
|
|
if user and passwd:
|
|
|
return (user, passwd)
|
|
|
|
|
|
if not self.ui.interactive:
|
|
|
raise util.Abort(_('http authorization required'))
|
|
|
|
|
|
self.ui.write(_("http authorization required\n"))
|
|
|
self.ui.status(_("realm: %s\n") % realm)
|
|
|
if user:
|
|
|
self.ui.status(_("user: %s\n") % user)
|
|
|
else:
|
|
|
user = self.ui.prompt(_("user:"), default=None)
|
|
|
|
|
|
if not passwd:
|
|
|
passwd = self.ui.getpass()
|
|
|
|
|
|
self.add_password(realm, authuri, user, passwd)
|
|
|
return (user, passwd)
|
|
|
|
|
|
def netlocsplit(netloc):
|
|
|
'''split [user[:passwd]@]host[:port] into 4-tuple.'''
|
|
|
|
|
|
a = netloc.find('@')
|
|
|
if a == -1:
|
|
|
user, passwd = None, None
|
|
|
else:
|
|
|
userpass, netloc = netloc[:a], netloc[a+1:]
|
|
|
c = userpass.find(':')
|
|
|
if c == -1:
|
|
|
user, passwd = urllib.unquote(userpass), None
|
|
|
else:
|
|
|
user = urllib.unquote(userpass[:c])
|
|
|
passwd = urllib.unquote(userpass[c+1:])
|
|
|
c = netloc.find(':')
|
|
|
if c == -1:
|
|
|
host, port = netloc, None
|
|
|
else:
|
|
|
host, port = netloc[:c], netloc[c+1:]
|
|
|
return host, port, user, passwd
|
|
|
|
|
|
def netlocunsplit(host, port, user=None, passwd=None):
|
|
|
'''turn host, port, user, passwd into [user[:passwd]@]host[:port].'''
|
|
|
if port:
|
|
|
hostport = host + ':' + port
|
|
|
else:
|
|
|
hostport = host
|
|
|
if user:
|
|
|
if passwd:
|
|
|
userpass = urllib.quote(user) + ':' + urllib.quote(passwd)
|
|
|
else:
|
|
|
userpass = urllib.quote(user)
|
|
|
return userpass + '@' + hostport
|
|
|
return hostport
|
|
|
|
|
|
# work around a bug in Python < 2.4.2
|
|
|
# (it leaves a "\n" at the end of Proxy-authorization headers)
|
|
|
class request(urllib2.Request):
|
|
|
def add_header(self, key, val):
|
|
|
if key.lower() == 'proxy-authorization':
|
|
|
val = val.strip()
|
|
|
return urllib2.Request.add_header(self, key, val)
|
|
|
|
|
|
class httpsendfile(file):
|
|
|
def __len__(self):
|
|
|
return os.fstat(self.fileno()).st_size
|
|
|
|
|
|
def _gen_sendfile(connection):
|
|
|
def _sendfile(self, data):
|
|
|
# send a file
|
|
|
if isinstance(data, httpsendfile):
|
|
|
# if auth required, some data sent twice, so rewind here
|
|
|
data.seek(0)
|
|
|
for chunk in util.filechunkiter(data):
|
|
|
connection.send(self, chunk)
|
|
|
else:
|
|
|
connection.send(self, data)
|
|
|
return _sendfile
|
|
|
|
|
|
class httpconnection(keepalive.HTTPConnection):
|
|
|
# must be able to send big bundle as stream.
|
|
|
send = _gen_sendfile(keepalive.HTTPConnection)
|
|
|
|
|
|
class basehttphandler(keepalive.HTTPHandler):
|
|
|
def http_open(self, req):
|
|
|
return self.do_open(httpconnection, req)
|
|
|
|
|
|
has_https = hasattr(urllib2, 'HTTPSHandler')
|
|
|
if has_https:
|
|
|
class httpsconnection(httplib.HTTPSConnection):
|
|
|
response_class = keepalive.HTTPResponse
|
|
|
# must be able to send big bundle as stream.
|
|
|
send = _gen_sendfile(httplib.HTTPSConnection)
|
|
|
|
|
|
class httphandler(basehttphandler, urllib2.HTTPSHandler):
|
|
|
def https_open(self, req):
|
|
|
return self.do_open(httpsconnection, req)
|
|
|
else:
|
|
|
class httphandler(basehttphandler):
|
|
|
pass
|
|
|
|
|
|
# In python < 2.5 AbstractDigestAuthHandler raises a ValueError if
|
|
|
# it doesn't know about the auth type requested. This can happen if
|
|
|
# somebody is using BasicAuth and types a bad password.
|
|
|
class httpdigestauthhandler(urllib2.HTTPDigestAuthHandler):
|
|
|
def http_error_auth_reqed(self, auth_header, host, req, headers):
|
|
|
try:
|
|
|
return urllib2.HTTPDigestAuthHandler.http_error_auth_reqed(
|
|
|
self, auth_header, host, req, headers)
|
|
|
except ValueError, inst:
|
|
|
arg = inst.args[0]
|
|
|
if arg.startswith("AbstractDigestAuthHandler doesn't know "):
|
|
|
return
|
|
|
raise
|
|
|
|
|
|
def zgenerator(f):
|
|
|
zd = zlib.decompressobj()
|
|
|
try:
|
|
|
for chunk in util.filechunkiter(f):
|
|
|
yield zd.decompress(chunk)
|
|
|
except httplib.HTTPException, inst:
|
|
|
raise IOError(None, _('connection ended unexpectedly'))
|
|
|
yield zd.flush()
|
|
|
|
|
|
_safe = ('abcdefghijklmnopqrstuvwxyz'
|
|
|
'ABCDEFGHIJKLMNOPQRSTUVWXYZ'
|
|
|
'0123456789' '_.-/')
|
|
|
_safeset = None
|
|
|
_hex = None
|
|
|
def quotepath(path):
|
|
|
'''quote the path part of a URL
|
|
|
|
|
|
This is similar to urllib.quote, but it also tries to avoid
|
|
|
quoting things twice (inspired by wget):
|
|
|
|
|
|
>>> quotepath('abc def')
|
|
|
'abc%20def'
|
|
|
>>> quotepath('abc%20def')
|
|
|
'abc%20def'
|
|
|
>>> quotepath('abc%20 def')
|
|
|
'abc%20%20def'
|
|
|
>>> quotepath('abc def%20')
|
|
|
'abc%20def%20'
|
|
|
>>> quotepath('abc def%2')
|
|
|
'abc%20def%252'
|
|
|
>>> quotepath('abc def%')
|
|
|
'abc%20def%25'
|
|
|
'''
|
|
|
global _safeset, _hex
|
|
|
if _safeset is None:
|
|
|
_safeset = util.set(_safe)
|
|
|
_hex = util.set('abcdefABCDEF0123456789')
|
|
|
l = list(path)
|
|
|
for i in xrange(len(l)):
|
|
|
c = l[i]
|
|
|
if c == '%' and i + 2 < len(l) and (l[i+1] in _hex and l[i+2] in _hex):
|
|
|
pass
|
|
|
elif c not in _safeset:
|
|
|
l[i] = '%%%02X' % ord(c)
|
|
|
return ''.join(l)
|
|
|
|
|
|
class httprepository(remoterepository):
|
|
|
def __init__(self, ui, path):
|
|
|
self.path = path
|
|
|
self.caps = None
|
|
|
self.handler = None
|
|
|
scheme, netloc, urlpath, query, frag = urlparse.urlsplit(path)
|
|
|
if query or frag:
|
|
|
raise util.Abort(_('unsupported URL component: "%s"') %
|
|
|
(query or frag))
|
|
|
if not urlpath:
|
|
|
urlpath = '/'
|
|
|
urlpath = quotepath(urlpath)
|
|
|
host, port, user, passwd = netlocsplit(netloc)
|
|
|
|
|
|
# urllib cannot handle URLs with embedded user or passwd
|
|
|
self._url = urlparse.urlunsplit((scheme, netlocunsplit(host, port),
|
|
|
urlpath, '', ''))
|
|
|
self.ui = ui
|
|
|
self.ui.debug(_('using %s\n') % self._url)
|
|
|
|
|
|
proxyurl = ui.config("http_proxy", "host") or os.getenv('http_proxy')
|
|
|
# XXX proxyauthinfo = None
|
|
|
self.handler = httphandler()
|
|
|
handlers = [self.handler]
|
|
|
|
|
|
if proxyurl:
|
|
|
# proxy can be proper url or host[:port]
|
|
|
if not (proxyurl.startswith('http:') or
|
|
|
proxyurl.startswith('https:')):
|
|
|
proxyurl = 'http://' + proxyurl + '/'
|
|
|
snpqf = urlparse.urlsplit(proxyurl)
|
|
|
proxyscheme, proxynetloc, proxypath, proxyquery, proxyfrag = snpqf
|
|
|
hpup = netlocsplit(proxynetloc)
|
|
|
|
|
|
proxyhost, proxyport, proxyuser, proxypasswd = hpup
|
|
|
if not proxyuser:
|
|
|
proxyuser = ui.config("http_proxy", "user")
|
|
|
proxypasswd = ui.config("http_proxy", "passwd")
|
|
|
|
|
|
# see if we should use a proxy for this url
|
|
|
no_list = [ "localhost", "127.0.0.1" ]
|
|
|
no_list.extend([p.lower() for
|
|
|
p in ui.configlist("http_proxy", "no")])
|
|
|
no_list.extend([p.strip().lower() for
|
|
|
p in os.getenv("no_proxy", '').split(',')
|
|
|
if p.strip()])
|
|
|
# "http_proxy.always" config is for running tests on localhost
|
|
|
if (not ui.configbool("http_proxy", "always") and
|
|
|
host.lower() in no_list):
|
|
|
# avoid auto-detection of proxy settings by appending
|
|
|
# a ProxyHandler with no proxies defined.
|
|
|
handlers.append(urllib2.ProxyHandler({}))
|
|
|
ui.debug(_('disabling proxy for %s\n') % host)
|
|
|
else:
|
|
|
proxyurl = urlparse.urlunsplit((
|
|
|
proxyscheme, netlocunsplit(proxyhost, proxyport,
|
|
|
proxyuser, proxypasswd or ''),
|
|
|
proxypath, proxyquery, proxyfrag))
|
|
|
handlers.append(urllib2.ProxyHandler({scheme: proxyurl}))
|
|
|
ui.debug(_('proxying through http://%s:%s\n') %
|
|
|
(proxyhost, proxyport))
|
|
|
|
|
|
# urllib2 takes proxy values from the environment and those
|
|
|
# will take precedence if found, so drop them
|
|
|
for env in ["HTTP_PROXY", "http_proxy", "no_proxy"]:
|
|
|
try:
|
|
|
if env in os.environ:
|
|
|
del os.environ[env]
|
|
|
except OSError:
|
|
|
pass
|
|
|
|
|
|
passmgr = passwordmgr(ui)
|
|
|
if user:
|
|
|
ui.debug(_('http auth: user %s, password %s\n') %
|
|
|
(user, passwd and '*' * len(passwd) or 'not set'))
|
|
|
netloc = host
|
|
|
if port:
|
|
|
netloc += ':' + port
|
|
|
# Python < 2.4.3 uses only the netloc to search for a password
|
|
|
passmgr.add_password(None, (self._url, netloc), user, passwd or '')
|
|
|
|
|
|
handlers.extend((urllib2.HTTPBasicAuthHandler(passmgr),
|
|
|
httpdigestauthhandler(passmgr)))
|
|
|
opener = urllib2.build_opener(*handlers)
|
|
|
|
|
|
# 1.0 here is the _protocol_ version
|
|
|
opener.addheaders = [('User-agent', 'mercurial/proto-1.0')]
|
|
|
urllib2.install_opener(opener)
|
|
|
|
|
|
def __del__(self):
|
|
|
if self.handler:
|
|
|
self.handler.close_all()
|
|
|
self.handler = None
|
|
|
|
|
|
def url(self):
|
|
|
return self.path
|
|
|
|
|
|
# look up capabilities only when needed
|
|
|
|
|
|
def get_caps(self):
|
|
|
if self.caps is None:
|
|
|
try:
|
|
|
self.caps = util.set(self.do_read('capabilities').split())
|
|
|
except repo.RepoError:
|
|
|
self.caps = util.set()
|
|
|
self.ui.debug(_('capabilities: %s\n') %
|
|
|
(' '.join(self.caps or ['none'])))
|
|
|
return self.caps
|
|
|
|
|
|
capabilities = property(get_caps)
|
|
|
|
|
|
def lock(self):
|
|
|
raise util.Abort(_('operation not supported over http'))
|
|
|
|
|
|
def do_cmd(self, cmd, **args):
|
|
|
data = args.pop('data', None)
|
|
|
headers = args.pop('headers', {})
|
|
|
self.ui.debug(_("sending %s command\n") % cmd)
|
|
|
q = {"cmd": cmd}
|
|
|
q.update(args)
|
|
|
qs = '?%s' % urllib.urlencode(q)
|
|
|
cu = "%s%s" % (self._url, qs)
|
|
|
try:
|
|
|
if data:
|
|
|
self.ui.debug(_("sending %s bytes\n") % len(data))
|
|
|
resp = urllib2.urlopen(request(cu, data, headers))
|
|
|
except urllib2.HTTPError, inst:
|
|
|
if inst.code == 401:
|
|
|
raise util.Abort(_('authorization failed'))
|
|
|
raise
|
|
|
except httplib.HTTPException, inst:
|
|
|
self.ui.debug(_('http error while sending %s command\n') % cmd)
|
|
|
self.ui.print_exc()
|
|
|
raise IOError(None, inst)
|
|
|
except IndexError:
|
|
|
# this only happens with Python 2.3, later versions raise URLError
|
|
|
raise util.Abort(_('http error, possibly caused by proxy setting'))
|
|
|
# record the url we got redirected to
|
|
|
resp_url = resp.geturl()
|
|
|
if resp_url.endswith(qs):
|
|
|
resp_url = resp_url[:-len(qs)]
|
|
|
if self._url != resp_url:
|
|
|
self.ui.status(_('real URL is %s\n') % resp_url)
|
|
|
self._url = resp_url
|
|
|
try:
|
|
|
proto = resp.getheader('content-type')
|
|
|
except AttributeError:
|
|
|
proto = resp.headers['content-type']
|
|
|
|
|
|
# accept old "text/plain" and "application/hg-changegroup" for now
|
|
|
if not (proto.startswith('application/mercurial-') or
|
|
|
proto.startswith('text/plain') or
|
|
|
proto.startswith('application/hg-changegroup')):
|
|
|
self.ui.debug(_("Requested URL: '%s'\n") % cu)
|
|
|
raise repo.RepoError(_("'%s' does not appear to be an hg repository")
|
|
|
% self._url)
|
|
|
|
|
|
if proto.startswith('application/mercurial-'):
|
|
|
try:
|
|
|
version = proto.split('-', 1)[1]
|
|
|
version_info = tuple([int(n) for n in version.split('.')])
|
|
|
except ValueError:
|
|
|
raise repo.RepoError(_("'%s' sent a broken Content-Type "
|
|
|
"header (%s)") % (self._url, proto))
|
|
|
if version_info > (0, 1):
|
|
|
raise repo.RepoError(_("'%s' uses newer protocol %s") %
|
|
|
(self._url, version))
|
|
|
|
|
|
return resp
|
|
|
|
|
|
def do_read(self, cmd, **args):
|
|
|
fp = self.do_cmd(cmd, **args)
|
|
|
try:
|
|
|
return fp.read()
|
|
|
finally:
|
|
|
# if using keepalive, allow connection to be reused
|
|
|
fp.close()
|
|
|
|
|
|
def lookup(self, key):
|
|
|
self.requirecap('lookup', _('look up remote revision'))
|
|
|
d = self.do_cmd("lookup", key = key).read()
|
|
|
success, data = d[:-1].split(' ', 1)
|
|
|
if int(success):
|
|
|
return bin(data)
|
|
|
raise repo.RepoError(data)
|
|
|
|
|
|
def heads(self):
|
|
|
d = self.do_read("heads")
|
|
|
try:
|
|
|
return map(bin, d[:-1].split(" "))
|
|
|
except:
|
|
|
raise util.UnexpectedOutput(_("unexpected response:"), d)
|
|
|
|
|
|
def branches(self, nodes):
|
|
|
n = " ".join(map(hex, nodes))
|
|
|
d = self.do_read("branches", nodes=n)
|
|
|
try:
|
|
|
br = [ tuple(map(bin, b.split(" "))) for b in d.splitlines() ]
|
|
|
return br
|
|
|
except:
|
|
|
raise util.UnexpectedOutput(_("unexpected response:"), d)
|
|
|
|
|
|
def between(self, pairs):
|
|
|
n = "\n".join(["-".join(map(hex, p)) for p in pairs])
|
|
|
d = self.do_read("between", pairs=n)
|
|
|
try:
|
|
|
p = [ l and map(bin, l.split(" ")) or [] for l in d.splitlines() ]
|
|
|
return p
|
|
|
except:
|
|
|
raise util.UnexpectedOutput(_("unexpected response:"), d)
|
|
|
|
|
|
def changegroup(self, nodes, kind):
|
|
|
n = " ".join(map(hex, nodes))
|
|
|
f = self.do_cmd("changegroup", roots=n)
|
|
|
return util.chunkbuffer(zgenerator(f))
|
|
|
|
|
|
def changegroupsubset(self, bases, heads, source):
|
|
|
self.requirecap('changegroupsubset', _('look up remote changes'))
|
|
|
baselst = " ".join([hex(n) for n in bases])
|
|
|
headlst = " ".join([hex(n) for n in heads])
|
|
|
f = self.do_cmd("changegroupsubset", bases=baselst, heads=headlst)
|
|
|
return util.chunkbuffer(zgenerator(f))
|
|
|
|
|
|
def unbundle(self, cg, heads, source):
|
|
|
# have to stream bundle to a temp file because we do not have
|
|
|
# http 1.1 chunked transfer.
|
|
|
|
|
|
type = ""
|
|
|
types = self.capable('unbundle')
|
|
|
# servers older than d1b16a746db6 will send 'unbundle' as a
|
|
|
# boolean capability
|
|
|
try:
|
|
|
types = types.split(',')
|
|
|
except AttributeError:
|
|
|
types = [""]
|
|
|
if types:
|
|
|
for x in types:
|
|
|
if x in changegroup.bundletypes:
|
|
|
type = x
|
|
|
break
|
|
|
|
|
|
tempname = changegroup.writebundle(cg, None, type)
|
|
|
fp = httpsendfile(tempname, "rb")
|
|
|
try:
|
|
|
try:
|
|
|
rfp = self.do_cmd(
|
|
|
'unbundle', data=fp,
|
|
|
headers={'Content-Type': 'application/octet-stream'},
|
|
|
heads=' '.join(map(hex, heads)))
|
|
|
try:
|
|
|
ret = int(rfp.readline())
|
|
|
self.ui.write(rfp.read())
|
|
|
return ret
|
|
|
finally:
|
|
|
rfp.close()
|
|
|
except socket.error, err:
|
|
|
if err[0] in (errno.ECONNRESET, errno.EPIPE):
|
|
|
raise util.Abort(_('push failed: %s') % err[1])
|
|
|
raise util.Abort(err[1])
|
|
|
finally:
|
|
|
fp.close()
|
|
|
os.unlink(tempname)
|
|
|
|
|
|
def stream_out(self):
|
|
|
return self.do_cmd('stream_out')
|
|
|
|
|
|
class httpsrepository(httprepository):
|
|
|
def __init__(self, ui, path):
|
|
|
if not has_https:
|
|
|
raise util.Abort(_('Python support for SSL and HTTPS '
|
|
|
'is not installed'))
|
|
|
httprepository.__init__(self, ui, path)
|
|
|
|
|
|
def instance(ui, path, create):
|
|
|
if create:
|
|
|
raise util.Abort(_('cannot create new http repository'))
|
|
|
if path.startswith('https:'):
|
|
|
return httpsrepository(ui, path)
|
|
|
return httprepository(ui, path)
|
|
|
|