upstream/mercurial-mirror Commit - r36877:a88d68dc

hgweb: create dedicated type for WSGI responses...

Gregory Szorc -

r36877:a88d68dc default

parent child

mercurial/hgweb/hgweb_mod.py

0 +5 -3

                 def _runwsgi(self, wsgireq, repo):
                     req = wsgireq.req
+                    res = wsgireq.res
                     rctx = requestcontext(self, repo)
                     # This state is global across all threads.
                         wsgireq.headers = [h for h in wsgireq.headers
                                            if h[0] != 'Content-Security-Policy']
                         wsgireq.headers.append(('Content-Security-Policy', rctx.csp))
+                        res.headers['Content-Security-Policy'] = rctx.csp
-                    handled, res = wireprotoserver.handlewsgirequest(
+                    handled = wireprotoserver.handlewsgirequest(
-                        rctx, wsgireq, req, self.check_perm)
+                        rctx, wsgireq, req, res, self.check_perm)
                     if handled:
-                        return res
+                        return res.sendresponse()
                     if req.havepathinfo:
                         query = req.dispatchpath

mercurial/hgweb/request.py

0 +124 0

@@ -23,6 +23,7 b' from ..thirdparty import ('
23	attr,	23	attr,
24	)	24	)
25	from .. import (	25	from .. import (
		26	error,
26	pycompat,	27	pycompat,
27	util,	28	util,
28	)	29	)
@@ -201,6 +202,128 b' def parserequestfromenv(env, bodyfh):'
201	headers=headers,	202	headers=headers,
202	bodyfh=bodyfh)	203	bodyfh=bodyfh)
203		204
		205	class wsgiresponse(object):
		206	"""Represents a response to a WSGI request.
		207
		208	A response consists of a status line, headers, and a body.
		209
		210	Consumers must populate the ``status`` and ``headers`` fields and
		211	make a call to a ``setbody*()`` method before the response can be
		212	issued.
		213
		214	When it is time to start sending the response over the wire,
		215	``sendresponse()`` is called. It handles emitting the header portion
		216	of the response message. It then yields chunks of body data to be
		217	written to the peer. Typically, the WSGI application itself calls
		218	and returns the value from ``sendresponse()``.
		219	"""
		220
		221	def __init__(self, req, startresponse):
		222	"""Create an empty response tied to a specific request.
		223
		224	``req`` is a ``parsedrequest``. ``startresponse`` is the
		225	``start_response`` function passed to the WSGI application.
		226	"""
		227	self._req = req
		228	self._startresponse = startresponse
		229
		230	self.status = None
		231	self.headers = wsgiheaders.Headers([])
		232
		233	self._bodybytes = None
		234	self._bodygen = None
		235	self._started = False
		236
		237	def setbodybytes(self, b):
		238	"""Define the response body as static bytes."""
		239	if self._bodybytes is not None or self._bodygen is not None:
		240	raise error.ProgrammingError('cannot define body multiple times')
		241
		242	self._bodybytes = b
		243	self.headers['Content-Length'] = '%d' % len(b)
		244
		245	def setbodygen(self, gen):
		246	"""Define the response body as a generator of bytes."""
		247	if self._bodybytes is not None or self._bodygen is not None:
		248	raise error.ProgrammingError('cannot define body multiple times')
		249
		250	self._bodygen = gen
		251
		252	def sendresponse(self):
		253	"""Send the generated response to the client.
		254
		255	Before this is called, ``status`` must be set and one of
		256	``setbodybytes()`` or ``setbodygen()`` must be called.
		257
		258	Calling this method multiple times is not allowed.
		259	"""
		260	if self._started:
		261	raise error.ProgrammingError('sendresponse() called multiple times')
		262
		263	self._started = True
		264
		265	if not self.status:
		266	raise error.ProgrammingError('status line not defined')
		267
		268	if self._bodybytes is None and self._bodygen is None:
		269	raise error.ProgrammingError('response body not defined')
		270
		271	# Various HTTP clients (notably httplib) won't read the HTTP response
		272	# until the HTTP request has been sent in full. If servers (us) send a
		273	# response before the HTTP request has been fully sent, the connection
		274	# may deadlock because neither end is reading.
		275	#
		276	# We work around this by "draining" the request data before
		277	# sending any response in some conditions.
		278	drain = False
		279	close = False
		280
		281	# If the client sent Expect: 100-continue, we assume it is smart enough
		282	# to deal with the server sending a response before reading the request.
		283	# (httplib doesn't do this.)
		284	if self._req.headers.get('Expect', '').lower() == '100-continue':
		285	pass
		286	# Only tend to request methods that have bodies. Strictly speaking,
		287	# we should sniff for a body. But this is fine for our existing
		288	# WSGI applications.
		289	elif self._req.method not in ('POST', 'PUT'):
		290	pass
		291	else:
		292	# If we don't know how much data to read, there's no guarantee
		293	# that we can drain the request responsibly. The WSGI
		294	# specification only says that servers should ensure the
		295	# input stream doesn't overrun the actual request. So there's
		296	# no guarantee that reading until EOF won't corrupt the stream
		297	# state.
		298	if not isinstance(self._req.bodyfh, util.cappedreader):
		299	close = True
		300	else:
		301	# We /could/ only drain certain HTTP response codes. But 200 and
		302	# non-200 wire protocol responses both require draining. Since
		303	# we have a capped reader in place for all situations where we
		304	# drain, it is safe to read from that stream. We'll either do
		305	# a drain or no-op if we're already at EOF.
		306	drain = True
		307
		308	if close:
		309	self.headers['Connection'] = 'Close'
		310
		311	if drain:
		312	assert isinstance(self._req.bodyfh, util.cappedreader)
		313	while True:
		314	chunk = self._req.bodyfh.read(32768)
		315	if not chunk:
		316	break
		317
		318	self._startresponse(pycompat.sysstr(self.status), self.headers.items())
		319	if self._bodybytes:
		320	yield self._bodybytes
		321	elif self._bodygen:
		322	for chunk in self._bodygen:
		323	yield chunk
		324	else:
		325	error.ProgrammingError('do not know how to send body')
		326
204	class wsgirequest(object):	327	class wsgirequest(object):
205	"""Higher-level API for a WSGI request.	328	"""Higher-level API for a WSGI request.
206		329
@@ -228,6 +351,7 b' class wsgirequest(object):'
228	self.env = wsgienv	351	self.env = wsgienv
229	self.req = parserequestfromenv(wsgienv, inp)	352	self.req = parserequestfromenv(wsgienv, inp)
230	self.form = self.req.querystringdict	353	self.form = self.req.querystringdict
		354	self.res = wsgiresponse(self.req, start_response)
231	self._start_response = start_response	355	self._start_response = start_response
232	self.server_write = None	356	self.server_write = None
233	self.headers = []	357	self.headers = []

mercurial/wireprotoserver.py

0 +51 -45

             def iscmd(cmd):
                 return cmd in wireproto.commands
-            def handlewsgirequest(rctx, wsgireq, req, checkperm):
+            def handlewsgirequest(rctx, wsgireq, req, res, checkperm):
                 """Possibly process a wire protocol request.
                 If the current request is a wire protocol request, the request is
                 ``wsgireq`` is a ``wsgirequest`` instance.
                 ``req`` is a ``parsedrequest`` instance.
+                ``res`` is a ``wsgiresponse`` instance.
-                Returns a 2-tuple of (bool, response) where the 1st element indicates
+                Returns a bool indicating if the request was serviced. If set, the caller
-                whether the request was handled and the 2nd element is a return
+                should stop processing the request, as a response has already been issued.
-                value for a WSGI application (often a generator of bytes).
                 """
                 # Avoid cycle involving hg module.
                 from .hgweb import common as hgwebcommon
                 # string parameter. If it isn't present, this isn't a wire protocol
                 # request.
                 if 'cmd' not in req.querystringdict:
-                    return False, None
+                    return False
                 cmd = req.querystringdict['cmd'][0]
                 # known wire protocol commands and it is less confusing for machine
                 # clients.
                 if not iscmd(cmd):
-                    return False, None
+                    return False
                 # The "cmd" query string argument is only valid on the root path of the
                 # repo. e.g. ``/?cmd=foo``, ``/repo?cmd=foo``. URL paths within the repo
                 # like ``/blah?cmd=foo`` are not allowed. So don't recognize the request
                 # in this case. We send an HTTP 404 for backwards compatibility reasons.
                 if req.dispatchpath:
-                    res = _handlehttperror(
+                    res.status = hgwebcommon.statusmessage(404)
-                        hgwebcommon.ErrorResponse(hgwebcommon.HTTP_NOT_FOUND), wsgireq,
+                    res.headers['Content-Type'] = HGTYPE
-                        req)
+                    # TODO This is not a good response to issue for this request. This
+                    # is mostly for BC for now.
-                    return True, res
+                    res.setbodybytes('0\n%s\n' % b'Not Found')
+                    return True
                 proto = httpv1protocolhandler(wsgireq, req, repo.ui,
                                               lambda perm: checkperm(rctx, wsgireq, perm))
                 # exception here. So consider refactoring into a exception type that
                 # is associated with the wire protocol.
                 try:
-                    res = _callhttp(repo, wsgireq, req, proto, cmd)
+                    _callhttp(repo, wsgireq, req, res, proto, cmd)
                 except hgwebcommon.ErrorResponse as e:
-                    res = _handlehttperror(e, wsgireq, req)
+                    for k, v in e.headers:
+                        res.headers[k] = v
+                    res.status = hgwebcommon.statusmessage(e.code, pycompat.bytestr(e))
+                    # TODO This response body assumes the failed command was
+                    # "unbundle." That assumption is not always valid.
+                    res.setbodybytes('0\n%s\n' % pycompat.bytestr(e))
-                return True, res
+                return True
             def _httpresponsetype(ui, req, prefer_uncompressed):
                 """Determine the appropriate response type and compression settings.
                 opts = {'level': ui.configint('server', 'zliblevel')}
                 return HGTYPE, util.compengines['zlib'], opts
-            def _callhttp(repo, wsgireq, req, proto, cmd):
+            def _callhttp(repo, wsgireq, req, res, proto, cmd):
+                # Avoid cycle involving hg module.
+                from .hgweb import common as hgwebcommon
                 def genversion2(gen, engine, engineopts):
                     # application/mercurial-0.2 always sends a payload header
                     # identifying the compression engine.
                     for chunk in gen:
                         yield chunk
+                def setresponse(code, contenttype, bodybytes=None, bodygen=None):
+                    if code == HTTP_OK:
+                        res.status = '200 Script output follows'
+                    else:
+                        res.status = hgwebcommon.statusmessage(code)
+                    res.headers['Content-Type'] = contenttype
+                    if bodybytes is not None:
+                        res.setbodybytes(bodybytes)
+                    if bodygen is not None:
+                        res.setbodygen(bodygen)
                 if not wireproto.commands.commandavailable(cmd, proto):
-                    wsgireq.respond(HTTP_OK, HGERRTYPE,
+                    setresponse(HTTP_OK, HGERRTYPE,
-                                    body=_('requested wire protocol command is not '
+                                _('requested wire protocol command is not available over '
-                                           'available over HTTP'))
+                                  'HTTP'))
-                    return []
+                    return
                 proto.checkperm(wireproto.commands[cmd].permission)
                 rsp = wireproto.dispatch(repo, proto, cmd)
                 if isinstance(rsp, bytes):
-                    wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
+                    setresponse(HTTP_OK, HGTYPE, bodybytes=rsp)
-                    return []
                 elif isinstance(rsp, wireprototypes.bytesresponse):
-                    wsgireq.respond(HTTP_OK, HGTYPE, body=rsp.data)
+                    setresponse(HTTP_OK, HGTYPE, bodybytes=rsp.data)
-                    return []
                 elif isinstance(rsp, wireprototypes.streamreslegacy):
-                    gen = rsp.gen
+                    setresponse(HTTP_OK, HGTYPE, bodygen=rsp.gen)
-                    wsgireq.respond(HTTP_OK, HGTYPE)
-                    return gen
                 elif isinstance(rsp, wireprototypes.streamres):
                     gen = rsp.gen
                     if mediatype == HGTYPE2:
                         gen = genversion2(gen, engine, engineopts)
-                    wsgireq.respond(HTTP_OK, mediatype)
+                    setresponse(HTTP_OK, mediatype, bodygen=gen)
-                    return gen
                 elif isinstance(rsp, wireprototypes.pushres):
                     rsp = '%d\n%s' % (rsp.res, rsp.output)
-                    wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
+                    setresponse(HTTP_OK, HGTYPE, bodybytes=rsp)
-                    return []
                 elif isinstance(rsp, wireprototypes.pusherr):
                     rsp = '0\n%s\n' % rsp.res
-                    wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
+                    res.drain = True
-                    return []
+                    setresponse(HTTP_OK, HGTYPE, bodybytes=rsp)
                 elif isinstance(rsp, wireprototypes.ooberror):
-                    rsp = rsp.message
+                    setresponse(HTTP_OK, HGERRTYPE, bodybytes=rsp.message)
-                    wsgireq.respond(HTTP_OK, HGERRTYPE, body=rsp)
+                else:
-                    return []
+                    raise error.ProgrammingError('hgweb.protocol internal failure', rsp)
-                raise error.ProgrammingError('hgweb.protocol internal failure', rsp)
-            def _handlehttperror(e, wsgireq, req):
-                """Called when an ErrorResponse is raised during HTTP request processing."""
-                # TODO This response body assumes the failed command was
-                # "unbundle." That assumption is not always valid.
-                wsgireq.respond(e, HGTYPE, body='0\n%s\n' % pycompat.bytestr(e))
-                return ''
             def _sshv1respondbytes(fout, value):
                 """Send a bytes response for protocol version 1."""

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages