upstream/mercurial-mirror Commit - r36871:2cdf47e1

hgweb: refactor the request draining code...

Gregory Szorc -

r36871:2cdf47e1 default

parent child

mercurial/hgweb/request.py

0 +47 -6

             # hgweb/request.py - An http request from either CGI or the standalone server.
             #
             # Copyright 21 May 2005 - (c) 2005 Jake Edge <jake@edge2.net>
             # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import cgi
             import errno
             import socket
             import wsgiref.headers as wsgiheaders
             #import wsgiref.validate
             from .common import (
                 ErrorResponse,
                 HTTP_NOT_MODIFIED,
                 statusmessage,
             )
             from ..thirdparty import (
                 attr,
             )
             from .. import (
                 pycompat,
                 util,
             )
             shortcuts = {
                 'cl': [('cmd', ['changelog']), ('rev', None)],
                 'sl': [('cmd', ['shortlog']), ('rev', None)],
                 'cs': [('cmd', ['changeset']), ('node', None)],
                 'f': [('cmd', ['file']), ('filenode', None)],
                 'fl': [('cmd', ['filelog']), ('filenode', None)],
                 'fd': [('cmd', ['filediff']), ('node', None)],
                 'fa': [('cmd', ['annotate']), ('filenode', None)],
                 'mf': [('cmd', ['manifest']), ('manifest', None)],
                 'ca': [('cmd', ['archive']), ('node', None)],
                 'tags': [('cmd', ['tags'])],
                 'tip': [('cmd', ['changeset']), ('node', ['tip'])],
                 'static': [('cmd', ['static']), ('file', None)]
             }
             def normalize(form):
                 # first expand the shortcuts
                 for k in shortcuts:
                     if k in form:
                         for name, value in shortcuts[k]:
                             if value is None:
                                 value = form[k]
                             form[name] = value
                         del form[k]
                 # And strip the values
                 bytesform = {}
                 for k, v in form.iteritems():
                     bytesform[pycompat.bytesurl(k)] = [
                         pycompat.bytesurl(i.strip()) for i in v]
                 return bytesform
             @attr.s(frozen=True)
             class parsedrequest(object):
                 """Represents a parsed WSGI request / static HTTP request parameters."""
                 # Request method.
                 method = attr.ib()
                 # Full URL for this request.
                 url = attr.ib()
                 # URL without any path components. Just <proto>://<host><port>.
                 baseurl = attr.ib()
                 # Advertised URL. Like ``url`` and ``baseurl`` but uses SERVER_NAME instead
                 # of HTTP: Host header for hostname. This is likely what clients used.
                 advertisedurl = attr.ib()
                 advertisedbaseurl = attr.ib()
                 # WSGI application path.
                 apppath = attr.ib()
                 # List of path parts to be used for dispatch.
                 dispatchparts = attr.ib()
                 # URL path component (no query string) used for dispatch.
                 dispatchpath = attr.ib()
                 # Whether there is a path component to this request. This can be true
                 # when ``dispatchpath`` is empty due to REPO_NAME muckery.
                 havepathinfo = attr.ib()
                 # Raw query string (part after "?" in URL).
                 querystring = attr.ib()
                 # List of 2-tuples of query string arguments.
                 querystringlist = attr.ib()
                 # Dict of query string arguments. Values are lists with at least 1 item.
                 querystringdict = attr.ib()
                 # wsgiref.headers.Headers instance. Operates like a dict with case
                 # insensitive keys.
                 headers = attr.ib()
             def parserequestfromenv(env):
                 """Parse URL components from environment variables.
                 WSGI defines request attributes via environment variables. This function
                 parses the environment variables into a data structure.
                 """
                 # PEP-0333 defines the WSGI spec and is a useful reference for this code.
                 # We first validate that the incoming object conforms with the WSGI spec.
                 # We only want to be dealing with spec-conforming WSGI implementations.
                 # TODO enable this once we fix internal violations.
                 #wsgiref.validate.check_environ(env)
                 # PEP-0333 states that environment keys and values are native strings
                 # (bytes on Python 2 and str on Python 3). The code points for the Unicode
                 # strings on Python 3 must be between \00000-\000FF. We deal with bytes
                 # in Mercurial, so mass convert string keys and values to bytes.
                 if pycompat.ispy3:
                     env = {k.encode('latin-1'): v for k, v in env.iteritems()}
                     env = {k: v.encode('latin-1') if isinstance(v, str) else v
                            for k, v in env.iteritems()}
                 # https://www.python.org/dev/peps/pep-0333/#environ-variables defines
                 # the environment variables.
                 # https://www.python.org/dev/peps/pep-0333/#url-reconstruction defines
                 # how URLs are reconstructed.
                 fullurl = env['wsgi.url_scheme'] + '://'
                 advertisedfullurl = fullurl
                 def addport(s):
                     if env['wsgi.url_scheme'] == 'https':
                         if env['SERVER_PORT'] != '443':
                             s += ':' + env['SERVER_PORT']
                     else:
                         if env['SERVER_PORT'] != '80':
                             s += ':' + env['SERVER_PORT']
                     return s
                 if env.get('HTTP_HOST'):
                     fullurl += env['HTTP_HOST']
                 else:
                     fullurl += env['SERVER_NAME']
                     fullurl = addport(fullurl)
                 advertisedfullurl += env['SERVER_NAME']
                 advertisedfullurl = addport(advertisedfullurl)
                 baseurl = fullurl
                 advertisedbaseurl = advertisedfullurl
                 fullurl += util.urlreq.quote(env.get('SCRIPT_NAME', ''))
                 advertisedfullurl += util.urlreq.quote(env.get('SCRIPT_NAME', ''))
                 fullurl += util.urlreq.quote(env.get('PATH_INFO', ''))
                 advertisedfullurl += util.urlreq.quote(env.get('PATH_INFO', ''))
                 if env.get('QUERY_STRING'):
                     fullurl += '?' + env['QUERY_STRING']
                     advertisedfullurl += '?' + env['QUERY_STRING']
                 # When dispatching requests, we look at the URL components (PATH_INFO
                 # and QUERY_STRING) after the application root (SCRIPT_NAME). But hgwebdir
                 # has the concept of "virtual" repositories. This is defined via REPO_NAME.
                 # If REPO_NAME is defined, we append it to SCRIPT_NAME to form a new app
                 # root. We also exclude its path components from PATH_INFO when resolving
                 # the dispatch path.
                 apppath = env['SCRIPT_NAME']
                 if env.get('REPO_NAME'):
                     if not apppath.endswith('/'):
                         apppath += '/'
                     apppath += env.get('REPO_NAME')
                 if 'PATH_INFO' in env:
                     dispatchparts = env['PATH_INFO'].strip('/').split('/')
                     # Strip out repo parts.
                     repoparts = env.get('REPO_NAME', '').split('/')
                     if dispatchparts[:len(repoparts)] == repoparts:
                         dispatchparts = dispatchparts[len(repoparts):]
                 else:
                     dispatchparts = []
                 dispatchpath = '/'.join(dispatchparts)
                 querystring = env.get('QUERY_STRING', '')
                 # We store as a list so we have ordering information. We also store as
                 # a dict to facilitate fast lookup.
                 querystringlist = util.urlreq.parseqsl(querystring, keep_blank_values=True)
                 querystringdict = {}
                 for k, v in querystringlist:
                     if k in querystringdict:
                         querystringdict[k].append(v)
                     else:
                         querystringdict[k] = [v]
                 # HTTP_* keys contain HTTP request headers. The Headers structure should
                 # perform case normalization for us. We just rewrite underscore to dash
                 # so keys match what likely went over the wire.
                 headers = []
                 for k, v in env.iteritems():
                     if k.startswith('HTTP_'):
                         headers.append((k[len('HTTP_'):].replace('_', '-'), v))
                 headers = wsgiheaders.Headers(headers)
                 # This is kind of a lie because the HTTP header wasn't explicitly
                 # sent. But for all intents and purposes it should be OK to lie about
                 # this, since a consumer will either either value to determine how many
                 # bytes are available to read.
                 if 'CONTENT_LENGTH' in env and 'HTTP_CONTENT_LENGTH' not in env:
                     headers['Content-Length'] = env['CONTENT_LENGTH']
                 return parsedrequest(method=env['REQUEST_METHOD'],
                                      url=fullurl, baseurl=baseurl,
                                      advertisedurl=advertisedfullurl,
                                      advertisedbaseurl=advertisedbaseurl,
                                      apppath=apppath,
                                      dispatchparts=dispatchparts, dispatchpath=dispatchpath,
                                      havepathinfo='PATH_INFO' in env,
                                      querystring=querystring,
                                      querystringlist=querystringlist,
                                      querystringdict=querystringdict,
                                      headers=headers)
             class wsgirequest(object):
                 """Higher-level API for a WSGI request.
                 WSGI applications are invoked with 2 arguments. They are used to
                 instantiate instances of this class, which provides higher-level APIs
                 for obtaining request parameters, writing HTTP output, etc.
                 """
                 def __init__(self, wsgienv, start_response):
                     version = wsgienv[r'wsgi.version']
                     if (version < (1, 0)) or (version >= (2, 0)):
                         raise RuntimeError("Unknown and unsupported WSGI version %d.%d"
                                            % version)
                     self.inp = wsgienv[r'wsgi.input']
                     if r'HTTP_CONTENT_LENGTH' in wsgienv:
                         self.inp = util.cappedreader(self.inp,
                                                      int(wsgienv[r'HTTP_CONTENT_LENGTH']))
                     elif r'CONTENT_LENGTH' in wsgienv:
                         self.inp = util.cappedreader(self.inp,
                                                      int(wsgienv[r'CONTENT_LENGTH']))
                     self.err = wsgienv[r'wsgi.errors']
                     self.threaded = wsgienv[r'wsgi.multithread']
                     self.multiprocess = wsgienv[r'wsgi.multiprocess']
                     self.run_once = wsgienv[r'wsgi.run_once']
                     self.env = wsgienv
                     self.form = normalize(cgi.parse(self.inp,
                                                     self.env,
                                                     keep_blank_values=1))
                     self._start_response = start_response
                     self.server_write = None
                     self.headers = []
-                def drain(self):
-                    '''need to read all data from request, httplib is half-duplex'''
-                    length = int(self.env.get('CONTENT_LENGTH') or 0)
-                    for s in util.filechunkiter(self.inp, limit=length):
-                        pass
                 def respond(self, status, type, filename=None, body=None):
                     if not isinstance(type, str):
                         type = pycompat.sysstr(type)
                     if self._start_response is not None:
                         self.headers.append((r'Content-Type', type))
                         if filename:
                             filename = (filename.rpartition('/')[-1]
                                         .replace('\\', '\\\\').replace('"', '\\"'))
                             self.headers.append(('Content-Disposition',
                                                  'inline; filename="%s"' % filename))
                         if body is not None:
                             self.headers.append((r'Content-Length', str(len(body))))
                         for k, v in self.headers:
                             if not isinstance(v, str):
                                 raise TypeError('header value must be string: %r' % (v,))
                         if isinstance(status, ErrorResponse):
                             self.headers.extend(status.headers)
                             if status.code == HTTP_NOT_MODIFIED:
                                 # RFC 2616 Section 10.3.5: 304 Not Modified has cases where
                                 # it MUST NOT include any headers other than these and no
                                 # body
                                 self.headers = [(k, v) for (k, v) in self.headers if
                                                 k in ('Date', 'ETag', 'Expires',
                                                       'Cache-Control', 'Vary')]
                             status = statusmessage(status.code, pycompat.bytestr(status))
                         elif status == 200:
                             status = '200 Script output follows'
                         elif isinstance(status, int):
                             status = statusmessage(status)
+                        # Various HTTP clients (notably httplib) won't read the HTTP
+                        # response until the HTTP request has been sent in full. If servers
+                        # (us) send a response before the HTTP request has been fully sent,
+                        # the connection may deadlock because neither end is reading.
+                        #
+                        # We work around this by "draining" the request data before
+                        # sending any response in some conditions.
+                        drain = False
+                        close = False
+                        # If the client sent Expect: 100-continue, we assume it is smart
+                        # enough to deal with the server sending a response before reading
+                        # the request. (httplib doesn't do this.)
+                        if self.env.get(r'HTTP_EXPECT', r'').lower() == r'100-continue':
+                            pass
+                        # Only tend to request methods that have bodies. Strictly speaking,
+                        # we should sniff for a body. But this is fine for our existing
+                        # WSGI applications.
+                        elif self.env[r'REQUEST_METHOD'] not in (r'POST', r'PUT'):
+                            pass
+                        else:
+                            # If we don't know how much data to read, there's no guarantee
+                            # that we can drain the request responsibly. The WSGI
+                            # specification only says that servers *should* ensure the
+                            # input stream doesn't overrun the actual request. So there's
+                            # no guarantee that reading until EOF won't corrupt the stream
+                            # state.
+                            if not isinstance(self.inp, util.cappedreader):
+                                close = True
+                            else:
+                                # We /could/ only drain certain HTTP response codes. But 200
+                                # and non-200 wire protocol responses both require draining.
+                                # Since we have a capped reader in place for all situations
+                                # where we drain, it is safe to read from that stream. We'll
+                                # either do a drain or no-op if we're already at EOF.
+                                drain = True
+                        if close:
+                            self.headers.append((r'Connection', r'Close'))
+                        if drain:
+                            assert isinstance(self.inp, util.cappedreader)
+                            while True:
+                                chunk = self.inp.read(32768)
+                                if not chunk:
+                                    break
                         self.server_write = self._start_response(
                             pycompat.sysstr(status), self.headers)
                         self._start_response = None
                         self.headers = []
                     if body is not None:
                         self.write(body)
                         self.server_write = None
                 def write(self, thing):
                     if thing:
                         try:
                             self.server_write(thing)
                         except socket.error as inst:
                             if inst[0] != errno.ECONNRESET:
                                 raise
                 def flush(self):
                     return None
             def wsgiapplication(app_maker):
                 '''For compatibility with old CGI scripts. A plain hgweb() or hgwebdir()
                 can and should now be used as a WSGI application.'''
                 application = app_maker()
                 def run_wsgi(env, respond):
                     return application(env, respond)
                 return run_wsgi

mercurial/wireprotoserver.py

0 0 -18

             # Copyright 21 May 2005 - (c) 2005 Jake Edge <jake@edge2.net>
             # Copyright 2005-2007 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import contextlib
             import struct
             import sys
             import threading
             from .i18n import _
             from . import (
                 encoding,
                 error,
                 hook,
                 pycompat,
                 util,
                 wireproto,
                 wireprototypes,
             )
             stringio = util.stringio
             urlerr = util.urlerr
             urlreq = util.urlreq
             HTTP_OK = 200
             HGTYPE = 'application/mercurial-0.1'
             HGTYPE2 = 'application/mercurial-0.2'
             HGERRTYPE = 'application/hg-error'
             SSHV1 = wireprototypes.SSHV1
             SSHV2 = wireprototypes.SSHV2
             def decodevaluefromheaders(req, headerprefix):
                 """Decode a long value from multiple HTTP request headers.
                 Returns the value as a bytes, not a str.
                 """
                 chunks = []
                 i = 1
                 while True:
                     v = req.headers.get(b'%s-%d' % (headerprefix, i))
                     if v is None:
                         break
                     chunks.append(pycompat.bytesurl(v))
                     i += 1
                 return ''.join(chunks)
             class httpv1protocolhandler(wireprototypes.baseprotocolhandler):
                 def __init__(self, wsgireq, req, ui, checkperm):
                     self._wsgireq = wsgireq
                     self._req = req
                     self._ui = ui
                     self._checkperm = checkperm
                 @property
                 def name(self):
                     return 'http-v1'
                 def getargs(self, args):
                     knownargs = self._args()
                     data = {}
                     keys = args.split()
                     for k in keys:
                         if k == '*':
                             star = {}
                             for key in knownargs.keys():
                                 if key != 'cmd' and key not in keys:
                                     star[key] = knownargs[key][0]
                             data['*'] = star
                         else:
                             data[k] = knownargs[k][0]
                     return [data[k] for k in keys]
                 def _args(self):
                     args = util.rapply(pycompat.bytesurl, self._wsgireq.form.copy())
                     postlen = int(self._req.headers.get(b'X-HgArgs-Post', 0))
                     if postlen:
                         args.update(urlreq.parseqs(
                             self._wsgireq.inp.read(postlen), keep_blank_values=True))
                         return args
                     argvalue = decodevaluefromheaders(self._req, b'X-HgArg')
                     args.update(urlreq.parseqs(argvalue, keep_blank_values=True))
                     return args
                 def forwardpayload(self, fp):
                     # Existing clients *always* send Content-Length.
                     length = int(self._req.headers[b'Content-Length'])
                     # If httppostargs is used, we need to read Content-Length
                     # minus the amount that was consumed by args.
                     length -= int(self._req.headers.get(b'X-HgArgs-Post', 0))
                     for s in util.filechunkiter(self._wsgireq.inp, limit=length):
                         fp.write(s)
                 @contextlib.contextmanager
                 def mayberedirectstdio(self):
                     oldout = self._ui.fout
                     olderr = self._ui.ferr
                     out = util.stringio()
                     try:
                         self._ui.fout = out
                         self._ui.ferr = out
                         yield out
                     finally:
                         self._ui.fout = oldout
                         self._ui.ferr = olderr
                 def client(self):
                     return 'remote:%s:%s:%s' % (
                         self._wsgireq.env.get('wsgi.url_scheme') or 'http',
                         urlreq.quote(self._wsgireq.env.get('REMOTE_HOST', '')),
                         urlreq.quote(self._wsgireq.env.get('REMOTE_USER', '')))
                 def addcapabilities(self, repo, caps):
                     caps.append('httpheader=%d' %
                                 repo.ui.configint('server', 'maxhttpheaderlen'))
                     if repo.ui.configbool('experimental', 'httppostargs'):
                         caps.append('httppostargs')
                     # FUTURE advertise 0.2rx once support is implemented
                     # FUTURE advertise minrx and mintx after consulting config option
                     caps.append('httpmediatype=0.1rx,0.1tx,0.2tx')
                     compengines = wireproto.supportedcompengines(repo.ui, util.SERVERROLE)
                     if compengines:
                         comptypes = ','.join(urlreq.quote(e.wireprotosupport().name)
                                              for e in compengines)
                         caps.append('compression=%s' % comptypes)
                     return caps
                 def checkperm(self, perm):
                     return self._checkperm(perm)
             # This method exists mostly so that extensions like remotefilelog can
             # disable a kludgey legacy method only over http. As of early 2018,
             # there are no other known users, so with any luck we can discard this
             # hook if remotefilelog becomes a first-party extension.
             def iscmd(cmd):
                 return cmd in wireproto.commands
             def handlewsgirequest(rctx, wsgireq, req, checkperm):
                 """Possibly process a wire protocol request.
                 If the current request is a wire protocol request, the request is
                 processed by this function.
                 ``wsgireq`` is a ``wsgirequest`` instance.
                 ``req`` is a ``parsedrequest`` instance.
                 Returns a 2-tuple of (bool, response) where the 1st element indicates
                 whether the request was handled and the 2nd element is a return
                 value for a WSGI application (often a generator of bytes).
                 """
                 # Avoid cycle involving hg module.
                 from .hgweb import common as hgwebcommon
                 repo = rctx.repo
                 # HTTP version 1 wire protocol requests are denoted by a "cmd" query
                 # string parameter. If it isn't present, this isn't a wire protocol
                 # request.
                 if 'cmd' not in req.querystringdict:
                     return False, None
                 cmd = req.querystringdict['cmd'][0]
                 # The "cmd" request parameter is used by both the wire protocol and hgweb.
                 # While not all wire protocol commands are available for all transports,
                 # if we see a "cmd" value that resembles a known wire protocol command, we
                 # route it to a protocol handler. This is better than routing possible
                 # wire protocol requests to hgweb because it prevents hgweb from using
                 # known wire protocol commands and it is less confusing for machine
                 # clients.
                 if not iscmd(cmd):
                     return False, None
                 # The "cmd" query string argument is only valid on the root path of the
                 # repo. e.g. ``/?cmd=foo``, ``/repo?cmd=foo``. URL paths within the repo
                 # like ``/blah?cmd=foo`` are not allowed. So don't recognize the request
                 # in this case. We send an HTTP 404 for backwards compatibility reasons.
                 if req.dispatchpath:
                     res = _handlehttperror(
                         hgwebcommon.ErrorResponse(hgwebcommon.HTTP_NOT_FOUND), wsgireq,
                         req)
                     return True, res
                 proto = httpv1protocolhandler(wsgireq, req, repo.ui,
                                               lambda perm: checkperm(rctx, wsgireq, perm))
                 # The permissions checker should be the only thing that can raise an
                 # ErrorResponse. It is kind of a layer violation to catch an hgweb
                 # exception here. So consider refactoring into a exception type that
                 # is associated with the wire protocol.
                 try:
                     res = _callhttp(repo, wsgireq, req, proto, cmd)
                 except hgwebcommon.ErrorResponse as e:
                     res = _handlehttperror(e, wsgireq, req)
                 return True, res
             def _httpresponsetype(ui, req, prefer_uncompressed):
                 """Determine the appropriate response type and compression settings.
                 Returns a tuple of (mediatype, compengine, engineopts).
                 """
                 # Determine the response media type and compression engine based
                 # on the request parameters.
                 protocaps = decodevaluefromheaders(req, 'X-HgProto').split(' ')
                 if '0.2' in protocaps:
                     # All clients are expected to support uncompressed data.
                     if prefer_uncompressed:
                         return HGTYPE2, util._noopengine(), {}
                     # Default as defined by wire protocol spec.
                     compformats = ['zlib', 'none']
                     for cap in protocaps:
                         if cap.startswith('comp='):
                             compformats = cap[5:].split(',')
                             break
                     # Now find an agreed upon compression format.
                     for engine in wireproto.supportedcompengines(ui, util.SERVERROLE):
                         if engine.wireprotosupport().name in compformats:
                             opts = {}
                             level = ui.configint('server', '%slevel' % engine.name())
                             if level is not None:
                                 opts['level'] = level
                             return HGTYPE2, engine, opts
                     # No mutually supported compression format. Fall back to the
                     # legacy protocol.
                 # Don't allow untrusted settings because disabling compression or
                 # setting a very high compression level could lead to flooding
                 # the server's network or CPU.
                 opts = {'level': ui.configint('server', 'zliblevel')}
                 return HGTYPE, util.compengines['zlib'], opts
             def _callhttp(repo, wsgireq, req, proto, cmd):
                 def genversion2(gen, engine, engineopts):
                     # application/mercurial-0.2 always sends a payload header
                     # identifying the compression engine.
                     name = engine.wireprotosupport().name
                     assert 0 < len(name) < 256
                     yield struct.pack('B', len(name))
                     yield name
                     for chunk in gen:
                         yield chunk
                 if not wireproto.commands.commandavailable(cmd, proto):
                     wsgireq.respond(HTTP_OK, HGERRTYPE,
                                     body=_('requested wire protocol command is not '
                                            'available over HTTP'))
                     return []
                 proto.checkperm(wireproto.commands[cmd].permission)
                 rsp = wireproto.dispatch(repo, proto, cmd)
                 if isinstance(rsp, bytes):
                     wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
                     return []
                 elif isinstance(rsp, wireprototypes.bytesresponse):
                     wsgireq.respond(HTTP_OK, HGTYPE, body=rsp.data)
                     return []
                 elif isinstance(rsp, wireprototypes.streamreslegacy):
                     gen = rsp.gen
                     wsgireq.respond(HTTP_OK, HGTYPE)
                     return gen
                 elif isinstance(rsp, wireprototypes.streamres):
                     gen = rsp.gen
                     # This code for compression should not be streamres specific. It
                     # is here because we only compress streamres at the moment.
                     mediatype, engine, engineopts = _httpresponsetype(
                         repo.ui, req, rsp.prefer_uncompressed)
                     gen = engine.compressstream(gen, engineopts)
                     if mediatype == HGTYPE2:
                         gen = genversion2(gen, engine, engineopts)
                     wsgireq.respond(HTTP_OK, mediatype)
                     return gen
                 elif isinstance(rsp, wireprototypes.pushres):
                     rsp = '%d\n%s' % (rsp.res, rsp.output)
                     wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
                     return []
                 elif isinstance(rsp, wireprototypes.pusherr):
-                    # This is the httplib workaround documented in _handlehttperror().
-                    wsgireq.drain()
                     rsp = '0\n%s\n' % rsp.res
                     wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
                     return []
                 elif isinstance(rsp, wireprototypes.ooberror):
                     rsp = rsp.message
                     wsgireq.respond(HTTP_OK, HGERRTYPE, body=rsp)
                     return []
                 raise error.ProgrammingError('hgweb.protocol internal failure', rsp)
             def _handlehttperror(e, wsgireq, req):
                 """Called when an ErrorResponse is raised during HTTP request processing."""
-                # Clients using Python's httplib are stateful: the HTTP client
-                # won't process an HTTP response until all request data is
-                # sent to the server. The intent of this code is to ensure
-                # we always read HTTP request data from the client, thus
-                # ensuring httplib transitions to a state that allows it to read
-                # the HTTP response. In other words, it helps prevent deadlocks
-                # on clients using httplib.
-                if (req.method == 'POST' and
-                    # But not if Expect: 100-continue is being used.
-                    (req.headers.get('Expect', '').lower() != '100-continue')):
-                    wsgireq.drain()
-                else:
-                    wsgireq.headers.append((r'Connection', r'Close'))
                 # TODO This response body assumes the failed command was
                 # "unbundle." That assumption is not always valid.
                 wsgireq.respond(e, HGTYPE, body='0\n%s\n' % pycompat.bytestr(e))
                 return ''
             def _sshv1respondbytes(fout, value):
                 """Send a bytes response for protocol version 1."""
                 fout.write('%d\n' % len(value))
                 fout.write(value)
                 fout.flush()
             def _sshv1respondstream(fout, source):
                 write = fout.write
                 for chunk in source.gen:
                     write(chunk)
                 fout.flush()
             def _sshv1respondooberror(fout, ferr, rsp):
                 ferr.write(b'%s\n-\n' % rsp)
                 ferr.flush()
                 fout.write(b'\n')
                 fout.flush()
             class sshv1protocolhandler(wireprototypes.baseprotocolhandler):
                 """Handler for requests services via version 1 of SSH protocol."""
                 def __init__(self, ui, fin, fout):
                     self._ui = ui
                     self._fin = fin
                     self._fout = fout
                 @property
                 def name(self):
                     return wireprototypes.SSHV1
                 def getargs(self, args):
                     data = {}
                     keys = args.split()
                     for n in xrange(len(keys)):
                         argline = self._fin.readline()[:-1]
                         arg, l = argline.split()
                         if arg not in keys:
                             raise error.Abort(_("unexpected parameter %r") % arg)
                         if arg == '*':
                             star = {}
                             for k in xrange(int(l)):
                                 argline = self._fin.readline()[:-1]
                                 arg, l = argline.split()
                                 val = self._fin.read(int(l))
                                 star[arg] = val
                             data['*'] = star
                         else:
                             val = self._fin.read(int(l))
                             data[arg] = val
                     return [data[k] for k in keys]
                 def forwardpayload(self, fpout):
                     # We initially send an empty response. This tells the client it is
                     # OK to start sending data. If a client sees any other response, it
                     # interprets it as an error.
                     _sshv1respondbytes(self._fout, b'')
                     # The file is in the form:
                     #
                     # <chunk size>\n<chunk>
                     # ...
                     # 0\n
                     count = int(self._fin.readline())
                     while count:
                         fpout.write(self._fin.read(count))
                         count = int(self._fin.readline())
                 @contextlib.contextmanager
                 def mayberedirectstdio(self):
                     yield None
                 def client(self):
                     client = encoding.environ.get('SSH_CLIENT', '').split(' ', 1)[0]
                     return 'remote:ssh:' + client
                 def addcapabilities(self, repo, caps):
                     return caps
                 def checkperm(self, perm):
                     pass
             class sshv2protocolhandler(sshv1protocolhandler):
                 """Protocol handler for version 2 of the SSH protocol."""
                 @property
                 def name(self):
                     return wireprototypes.SSHV2
             def _runsshserver(ui, repo, fin, fout, ev):
                 # This function operates like a state machine of sorts. The following
                 # states are defined:
                 #
                 # protov1-serving
                 #    Server is in protocol version 1 serving mode. Commands arrive on
                 #    new lines. These commands are processed in this state, one command
                 #    after the other.
                 #
                 # protov2-serving
                 #    Server is in protocol version 2 serving mode.
                 #
                 # upgrade-initial
                 #    The server is going to process an upgrade request.
                 #
                 # upgrade-v2-filter-legacy-handshake
                 #    The protocol is being upgraded to version 2. The server is expecting
                 #    the legacy handshake from version 1.
                 #
                 # upgrade-v2-finish
                 #    The upgrade to version 2 of the protocol is imminent.
                 #
                 # shutdown
                 #    The server is shutting down, possibly in reaction to a client event.
                 #
                 # And here are their transitions:
                 #
                 # protov1-serving -> shutdown
                 #    When server receives an empty request or encounters another
                 #    error.
                 #
                 # protov1-serving -> upgrade-initial
                 #    An upgrade request line was seen.
                 #
                 # upgrade-initial -> upgrade-v2-filter-legacy-handshake
                 #    Upgrade to version 2 in progress. Server is expecting to
                 #    process a legacy handshake.
                 #
                 # upgrade-v2-filter-legacy-handshake -> shutdown
                 #    Client did not fulfill upgrade handshake requirements.
                 #
                 # upgrade-v2-filter-legacy-handshake -> upgrade-v2-finish
                 #    Client fulfilled version 2 upgrade requirements. Finishing that
                 #    upgrade.
                 #
                 # upgrade-v2-finish -> protov2-serving
                 #    Protocol upgrade to version 2 complete. Server can now speak protocol
                 #    version 2.
                 #
                 # protov2-serving -> protov1-serving
                 #    Ths happens by default since protocol version 2 is the same as
                 #    version 1 except for the handshake.
                 state = 'protov1-serving'
                 proto = sshv1protocolhandler(ui, fin, fout)
                 protoswitched = False
                 while not ev.is_set():
                     if state == 'protov1-serving':
                         # Commands are issued on new lines.
                         request = fin.readline()[:-1]
                         # Empty lines signal to terminate the connection.
                         if not request:
                             state = 'shutdown'
                             continue
                         # It looks like a protocol upgrade request. Transition state to
                         # handle it.
                         if request.startswith(b'upgrade '):
                             if protoswitched:
                                 _sshv1respondooberror(fout, ui.ferr,
                                                       b'cannot upgrade protocols multiple '
                                                       b'times')
                                 state = 'shutdown'
                                 continue
                             state = 'upgrade-initial'
                             continue
                         available = wireproto.commands.commandavailable(request, proto)
                         # This command isn't available. Send an empty response and go
                         # back to waiting for a new command.
                         if not available:
                             _sshv1respondbytes(fout, b'')
                             continue
                         rsp = wireproto.dispatch(repo, proto, request)
                         if isinstance(rsp, bytes):
                             _sshv1respondbytes(fout, rsp)
                         elif isinstance(rsp, wireprototypes.bytesresponse):
                             _sshv1respondbytes(fout, rsp.data)
                         elif isinstance(rsp, wireprototypes.streamres):
                             _sshv1respondstream(fout, rsp)
                         elif isinstance(rsp, wireprototypes.streamreslegacy):
                             _sshv1respondstream(fout, rsp)
                         elif isinstance(rsp, wireprototypes.pushres):
                             _sshv1respondbytes(fout, b'')
                             _sshv1respondbytes(fout, b'%d' % rsp.res)
                         elif isinstance(rsp, wireprototypes.pusherr):
                             _sshv1respondbytes(fout, rsp.res)
                         elif isinstance(rsp, wireprototypes.ooberror):
                             _sshv1respondooberror(fout, ui.ferr, rsp.message)
                         else:
                             raise error.ProgrammingError('unhandled response type from '
                                                          'wire protocol command: %s' % rsp)
                     # For now, protocol version 2 serving just goes back to version 1.
                     elif state == 'protov2-serving':
                         state = 'protov1-serving'
                         continue
                     elif state == 'upgrade-initial':
                         # We should never transition into this state if we've switched
                         # protocols.
                         assert not protoswitched
                         assert proto.name == wireprototypes.SSHV1
                         # Expected: upgrade <token> <capabilities>
                         # If we get something else, the request is malformed. It could be
                         # from a future client that has altered the upgrade line content.
                         # We treat this as an unknown command.
                         try:
                             token, caps = request.split(b' ')[1:]
                         except ValueError:
                             _sshv1respondbytes(fout, b'')
                             state = 'protov1-serving'
                             continue
                         # Send empty response if we don't support upgrading protocols.
                         if not ui.configbool('experimental', 'sshserver.support-v2'):
                             _sshv1respondbytes(fout, b'')
                             state = 'protov1-serving'
                             continue
                         try:
                             caps = urlreq.parseqs(caps)
                         except ValueError:
                             _sshv1respondbytes(fout, b'')
                             state = 'protov1-serving'
                             continue
                         # We don't see an upgrade request to protocol version 2. Ignore
                         # the upgrade request.
                         wantedprotos = caps.get(b'proto', [b''])[0]
                         if SSHV2 not in wantedprotos:
                             _sshv1respondbytes(fout, b'')
                             state = 'protov1-serving'
                             continue
                         # It looks like we can honor this upgrade request to protocol 2.
                         # Filter the rest of the handshake protocol request lines.
                         state = 'upgrade-v2-filter-legacy-handshake'
                         continue
                     elif state == 'upgrade-v2-filter-legacy-handshake':
                         # Client should have sent legacy handshake after an ``upgrade``
                         # request. Expected lines:
                         #
                         #    hello
                         #    between
                         #    pairs 81
                         #    0000...-0000...
                         ok = True
                         for line in (b'hello', b'between', b'pairs 81'):
                             request = fin.readline()[:-1]
                             if request != line:
                                 _sshv1respondooberror(fout, ui.ferr,
                                                       b'malformed handshake protocol: '
                                                       b'missing %s' % line)
                                 ok = False
                                 state = 'shutdown'
                                 break
                         if not ok:
                             continue
                         request = fin.read(81)
                         if request != b'%s-%s' % (b'0' * 40, b'0' * 40):
                             _sshv1respondooberror(fout, ui.ferr,
                                                   b'malformed handshake protocol: '
                                                   b'missing between argument value')
                             state = 'shutdown'
                             continue
                         state = 'upgrade-v2-finish'
                         continue
                     elif state == 'upgrade-v2-finish':
                         # Send the upgrade response.
                         fout.write(b'upgraded %s %s\n' % (token, SSHV2))
                         servercaps = wireproto.capabilities(repo, proto)
                         rsp = b'capabilities: %s' % servercaps.data
                         fout.write(b'%d\n%s\n' % (len(rsp), rsp))
                         fout.flush()
                         proto = sshv2protocolhandler(ui, fin, fout)
                         protoswitched = True
                         state = 'protov2-serving'
                         continue
                     elif state == 'shutdown':
                         break
                     else:
                         raise error.ProgrammingError('unhandled ssh server state: %s' %
                                                      state)
             class sshserver(object):
                 def __init__(self, ui, repo, logfh=None):
                     self._ui = ui
                     self._repo = repo
                     self._fin = ui.fin
                     self._fout = ui.fout
                     # Log write I/O to stdout and stderr if configured.
                     if logfh:
                         self._fout = util.makeloggingfileobject(
                             logfh, self._fout, 'o', logdata=True)
                         ui.ferr = util.makeloggingfileobject(
                             logfh, ui.ferr, 'e', logdata=True)
                     hook.redirect(True)
                     ui.fout = repo.ui.fout = ui.ferr
                     # Prevent insertion/deletion of CRs
                     util.setbinary(self._fin)
                     util.setbinary(self._fout)
                 def serve_forever(self):
                     self.serveuntil(threading.Event())
                     sys.exit(0)
                 def serveuntil(self, ev):
                     """Serve until a threading.Event is set."""
                     _runsshserver(self._ui, self._repo, self._fin, self._fout, ev)

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages