upstream/mercurial-mirror Commit - r36871:2cdf47e1

hgweb: refactor the request draining code...

Gregory Szorc -

r36871:2cdf47e1 default

parent child

mercurial/hgweb/request.py

0 +47 -6

@@ -254,12 +254,6 class wsgirequest(object):
254	self.server_write = None	254	self.server_write = None
255	self.headers = []	255	self.headers = []
256		256
257	def drain(self):
258	'''need to read all data from request, httplib is half-duplex'''
259	length = int(self.env.get('CONTENT_LENGTH') or 0)
260	for s in util.filechunkiter(self.inp, limit=length):
261	pass
262
263	def respond(self, status, type, filename=None, body=None):	257	def respond(self, status, type, filename=None, body=None):
264	if not isinstance(type, str):	258	if not isinstance(type, str):
265	type = pycompat.sysstr(type)	259	type = pycompat.sysstr(type)
@@ -292,6 +286,53 class wsgirequest(object):
292	elif isinstance(status, int):	286	elif isinstance(status, int):
293	status = statusmessage(status)	287	status = statusmessage(status)
294		288
		289	# Various HTTP clients (notably httplib) won't read the HTTP
		290	# response until the HTTP request has been sent in full. If servers
		291	# (us) send a response before the HTTP request has been fully sent,
		292	# the connection may deadlock because neither end is reading.
		293	#
		294	# We work around this by "draining" the request data before
		295	# sending any response in some conditions.
		296	drain = False
		297	close = False
		298
		299	# If the client sent Expect: 100-continue, we assume it is smart
		300	# enough to deal with the server sending a response before reading
		301	# the request. (httplib doesn't do this.)
		302	if self.env.get(r'HTTP_EXPECT', r'').lower() == r'100-continue':
		303	pass
		304	# Only tend to request methods that have bodies. Strictly speaking,
		305	# we should sniff for a body. But this is fine for our existing
		306	# WSGI applications.
		307	elif self.env[r'REQUEST_METHOD'] not in (r'POST', r'PUT'):
		308	pass
		309	else:
		310	# If we don't know how much data to read, there's no guarantee
		311	# that we can drain the request responsibly. The WSGI
		312	# specification only says that servers should ensure the
		313	# input stream doesn't overrun the actual request. So there's
		314	# no guarantee that reading until EOF won't corrupt the stream
		315	# state.
		316	if not isinstance(self.inp, util.cappedreader):
		317	close = True
		318	else:
		319	# We /could/ only drain certain HTTP response codes. But 200
		320	# and non-200 wire protocol responses both require draining.
		321	# Since we have a capped reader in place for all situations
		322	# where we drain, it is safe to read from that stream. We'll
		323	# either do a drain or no-op if we're already at EOF.
		324	drain = True
		325
		326	if close:
		327	self.headers.append((r'Connection', r'Close'))
		328
		329	if drain:
		330	assert isinstance(self.inp, util.cappedreader)
		331	while True:
		332	chunk = self.inp.read(32768)
		333	if not chunk:
		334	break
		335
295	self.server_write = self._start_response(	336	self.server_write = self._start_response(
296	pycompat.sysstr(status), self.headers)	337	pycompat.sysstr(status), self.headers)
297	self._start_response = None	338	self._start_response = None

mercurial/wireprotoserver.py

0 0 -18

@@ -301,9 +301,6 def _callhttp(repo, wsgireq, req, proto,
301	wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)	301	wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
302	return []	302	return []
303	elif isinstance(rsp, wireprototypes.pusherr):	303	elif isinstance(rsp, wireprototypes.pusherr):
304	# This is the httplib workaround documented in _handlehttperror().
305	wsgireq.drain()
306
307	rsp = '0\n%s\n' % rsp.res	304	rsp = '0\n%s\n' % rsp.res
308	wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)	305	wsgireq.respond(HTTP_OK, HGTYPE, body=rsp)
309	return []	306	return []
@@ -316,21 +313,6 def _callhttp(repo, wsgireq, req, proto,
316	def _handlehttperror(e, wsgireq, req):	313	def _handlehttperror(e, wsgireq, req):
317	"""Called when an ErrorResponse is raised during HTTP request processing."""	314	"""Called when an ErrorResponse is raised during HTTP request processing."""
318		315
319	# Clients using Python's httplib are stateful: the HTTP client
320	# won't process an HTTP response until all request data is
321	# sent to the server. The intent of this code is to ensure
322	# we always read HTTP request data from the client, thus
323	# ensuring httplib transitions to a state that allows it to read
324	# the HTTP response. In other words, it helps prevent deadlocks
325	# on clients using httplib.
326
327	if (req.method == 'POST' and
328	# But not if Expect: 100-continue is being used.
329	(req.headers.get('Expect', '').lower() != '100-continue')):
330	wsgireq.drain()
331	else:
332	wsgireq.headers.append((r'Connection', r'Close'))
333
334	# TODO This response body assumes the failed command was	316	# TODO This response body assumes the failed command was
335	# "unbundle." That assumption is not always valid.	317	# "unbundle." That assumption is not always valid.
336	wsgireq.respond(e, HGTYPE, body='0\n%s\n' % pycompat.bytestr(e))	318	wsgireq.respond(e, HGTYPE, body='0\n%s\n' % pycompat.bytestr(e))

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages