upstream/mercurial-mirror Commit - r36912:b2a3308d

1

# hgweb/request.py - An http request from either CGI or the standalone server.

1

# hgweb/request.py - An http request from either CGI or the standalone server.

2

#

2

#

3

4

5

#

5

#

6

# This software may be used and distributed according to the terms of the

6

# This software may be used and distributed according to the terms of the

7

# GNU General Public License version 2 or any later version.

7

# GNU General Public License version 2 or any later version.

8

9

from __future__ import absolute_import

9

from __future__ import absolute_import

10

11

import errno

11

import errno

12

import socket

12

import socket

13

import wsgiref.headers as wsgiheaders

13

import wsgiref.headers as wsgiheaders

14

#import wsgiref.validate

14

#import wsgiref.validate

15

16

from .common import (

16

from .common import (

17

ErrorResponse,

17

ErrorResponse,

18

statusmessage,

18

statusmessage,

19

)

19

)

20

21

from ..thirdparty import (

21

from ..thirdparty import (

22

attr,

22

attr,

23

)

23

)

24

from .. import (

24

from .. import (

25

error,

25

error,

26

pycompat,

26

pycompat,

27

util,

27

util,

28

)

28

)

29

30

class multidict(object):
    """Dict-like container that may hold several values per key.

    Used to store parsed request parameters.

    This is inspired by WebOb's class of the same name.
    """

    def __init__(self):
        # Insertion-ordered list of (key, value) 2-tuples. Lookups are a
        # linear scan, which is acceptable because request parameters are
        # few. A dict index can be added later if this becomes a hot spot.
        self._items = []

    def __getitem__(self, key):
        """Return the most recently added value for ``key``.

        Raises ``KeyError`` if the key has no values.
        """
        for pos in range(len(self._items) - 1, -1, -1):
            name, value = self._items[pos]
            if name == key:
                return value

        raise KeyError(key)

    def __setitem__(self, key, value):
        """Drop every existing value for ``key`` and store ``value``."""
        self._items[:] = [pair for pair in self._items if pair[0] != key]
        self._items.append((key, value))

    def __delitem__(self, key):
        """Remove every value for ``key``.

        Raises ``KeyError`` if the key has no values.
        """
        remaining = [pair for pair in self._items if pair[0] != key]

        # Nothing was filtered out, so the key was never present.
        if len(remaining) == len(self._items):
            raise KeyError(key)

        self._items[:] = remaining

    def __contains__(self, key):
        for name, _value in self._items:
            if name == key:
                return True

        return False

    def __len__(self):
        # Counts stored (key, value) pairs, not distinct keys.
        return len(self._items)

    def get(self, key, default=None):
        """Return the last value for ``key``, or ``default`` if absent."""
        try:
            return self[key]
        except KeyError:
            return default

    def add(self, key, value):
        """Append a value for ``key`` while keeping any existing values."""
        self._items.append((key, value))

    def getall(self, key):
        """Return a list of every value for ``key`` in insertion order."""
        matches = []
        for name, value in self._items:
            if name == key:
                matches.append(value)

        return matches

    def getone(self, key):
        """Return the only value stored for ``key``.

        Raises ``KeyError`` if the key is absent or has more than one value.
        """
        found = self.getall(key)
        count = len(found)

        if count == 0:
            raise KeyError(key)

        if count > 1:
            raise KeyError('multiple values for %r' % key)

        return found[0]

    def asdictoflists(self):
        """Return a plain dict mapping each key to the list of its values."""
        grouped = {}
        for name, value in self._items:
            grouped.setdefault(name, []).append(value)

        return grouped

113

114

@attr.s(frozen=True)
class parsedrequest(object):
    """Represents a parsed WSGI request.

    Contains both parsed parameters as well as a handle on the input stream.

    The class is declared frozen, so attributes cannot be reassigned after
    construction.
    """

    # Request method.
    method = attr.ib()
    # Full URL for this request.
    url = attr.ib()
    # URL without any path components. Just <proto>://<host><port>.
    baseurl = attr.ib()
    # Advertised URL. Like ``url`` and ``baseurl`` but uses SERVER_NAME instead
    # of HTTP: Host header for hostname. This is likely what clients used.
    advertisedurl = attr.ib()
    advertisedbaseurl = attr.ib()
    # URL scheme (part before ``://``). e.g. ``http`` or ``https``.
    urlscheme = attr.ib()
    # Value of REMOTE_USER, if set, or None.
    remoteuser = attr.ib()
    # Value of REMOTE_HOST, if set, or None.
    remotehost = attr.ib()
    # WSGI application path.
    apppath = attr.ib()
    # List of path parts to be used for dispatch.
    dispatchparts = attr.ib()
    # URL path component (no query string) used for dispatch.
    dispatchpath = attr.ib()
    # Whether there is a path component to this request. This can be true
    # when ``dispatchpath`` is empty due to REPO_NAME muckery.
    havepathinfo = attr.ib()
    # The name of the repository being accessed.
    reponame = attr.ib()
    # Raw query string (part after "?" in URL).
    querystring = attr.ib()
    # multidict of query string parameters.
    qsparams = attr.ib()
    # wsgiref.headers.Headers instance. Operates like a dict with case
    # insensitive keys.
    headers = attr.ib()
    # Request body input stream.
    bodyfh = attr.ib()

157

158

def parserequestfromenv(env, bodyfh):
    """Parse URL components from environment variables.

    WSGI defines request attributes via environment variables. This function
    parses the environment variables into a data structure.

    ``env`` is the WSGI environment dict. ``bodyfh`` is the request body
    input stream; it is stored on the result unchanged.

    Returns a ``parsedrequest``.

    Raises ``KeyError`` if ``wsgi.url_scheme``, ``SERVER_NAME``,
    ``SERVER_PORT`` or ``REQUEST_METHOD`` is missing from ``env``.
    ``SCRIPT_NAME``, ``PATH_INFO``, ``QUERY_STRING`` and ``REPO_NAME`` are
    optional.
    """
    # PEP-0333 defines the WSGI spec and is a useful reference for this code.

    # We first validate that the incoming object conforms with the WSGI spec.
    # We only want to be dealing with spec-conforming WSGI implementations.
    # TODO enable this once we fix internal violations.
    #wsgiref.validate.check_environ(env)

    # PEP-0333 states that environment keys and values are native strings
    # (bytes on Python 2 and str on Python 3). The code points for the Unicode
    # strings on Python 3 must be between \00000-\000FF. We deal with bytes
    # in Mercurial, so mass convert string keys and values to bytes.
    # Non-string values (e.g. ``wsgi.input``) are passed through untouched.
    if pycompat.ispy3:
        env = {k.encode('latin-1'):
               v.encode('latin-1') if isinstance(v, str) else v
               for k, v in env.items()}

    # https://www.python.org/dev/peps/pep-0333/#environ-variables defines
    # the environment variables.
    # https://www.python.org/dev/peps/pep-0333/#url-reconstruction defines
    # how URLs are reconstructed.
    fullurl = env['wsgi.url_scheme'] + '://'
    advertisedfullurl = fullurl

    def addport(s):
        # Only append the port when it differs from the scheme's default.
        if env['wsgi.url_scheme'] == 'https':
            defaultport = '443'
        else:
            defaultport = '80'

        if env['SERVER_PORT'] != defaultport:
            s += ':' + env['SERVER_PORT']

        return s

    # A Host header value is used verbatim (no port is appended to it).
    # Otherwise fall back to SERVER_NAME plus port.
    if env.get('HTTP_HOST'):
        fullurl += env['HTTP_HOST']
    else:
        fullurl += env['SERVER_NAME']
        fullurl = addport(fullurl)

    # The advertised URL always uses SERVER_NAME, ignoring the Host header.
    advertisedfullurl += env['SERVER_NAME']
    advertisedfullurl = addport(advertisedfullurl)

    baseurl = fullurl
    advertisedbaseurl = advertisedfullurl

    fullurl += util.urlreq.quote(env.get('SCRIPT_NAME', ''))
    advertisedfullurl += util.urlreq.quote(env.get('SCRIPT_NAME', ''))
    fullurl += util.urlreq.quote(env.get('PATH_INFO', ''))
    advertisedfullurl += util.urlreq.quote(env.get('PATH_INFO', ''))

    if env.get('QUERY_STRING'):
        fullurl += '?' + env['QUERY_STRING']
        advertisedfullurl += '?' + env['QUERY_STRING']

    # When dispatching requests, we look at the URL components (PATH_INFO
    # and QUERY_STRING) after the application root (SCRIPT_NAME). But hgwebdir
    # has the concept of "virtual" repositories. This is defined via REPO_NAME.
    # If REPO_NAME is defined, we append it to SCRIPT_NAME to form a new app
    # root. We also exclude its path components from PATH_INFO when resolving
    # the dispatch path.

    # SCRIPT_NAME may be absent; treat that the same as an empty string, as
    # the URL reconstruction above already does.
    apppath = env.get('SCRIPT_NAME', '')

    if env.get('REPO_NAME'):
        if not apppath.endswith('/'):
            apppath += '/'

        apppath += env.get('REPO_NAME')

    if 'PATH_INFO' in env:
        dispatchparts = env['PATH_INFO'].strip('/').split('/')

        # Strip out repo parts. Without REPO_NAME, ``repoparts`` is ``['']``,
        # which also matches (and removes) the single empty component
        # produced by an empty or "/" PATH_INFO.
        repoparts = env.get('REPO_NAME', '').split('/')
        if dispatchparts[:len(repoparts)] == repoparts:
            dispatchparts = dispatchparts[len(repoparts):]
    else:
        dispatchparts = []

    dispatchpath = '/'.join(dispatchparts)

    querystring = env.get('QUERY_STRING', '')

    # A multidict preserves both parameter ordering and repeated keys.
    qsparams = multidict()
    for k, v in util.urlreq.parseqsl(querystring, keep_blank_values=True):
        qsparams.add(k, v)

    # HTTP_* keys contain HTTP request headers. The Headers structure should
    # perform case normalization for us. We just rewrite underscore to dash
    # so keys match what likely went over the wire.
    headers = []
    for k, v in env.items():
        if k.startswith('HTTP_'):
            headers.append((k[len('HTTP_'):].replace('_', '-'), v))

    headers = wsgiheaders.Headers(headers)

    # This is kind of a lie because the HTTP header wasn't explicitly
    # sent. But for all intents and purposes it should be OK to lie about
    # this, since a consumer will use either value to determine how many
    # bytes are available to read.
    if 'CONTENT_LENGTH' in env and 'HTTP_CONTENT_LENGTH' not in env:
        headers['Content-Length'] = env['CONTENT_LENGTH']

    # TODO do this once we remove wsgirequest.inp, otherwise we could have
    # multiple readers from the underlying input stream.
    #bodyfh = env['wsgi.input']
    #if 'Content-Length' in headers:
    #    bodyfh = util.cappedreader(bodyfh, int(headers['Content-Length']))

    return parsedrequest(method=env['REQUEST_METHOD'],
                         url=fullurl, baseurl=baseurl,
                         advertisedurl=advertisedfullurl,
                         advertisedbaseurl=advertisedbaseurl,
                         urlscheme=env['wsgi.url_scheme'],
                         remoteuser=env.get('REMOTE_USER'),
                         remotehost=env.get('REMOTE_HOST'),
                         apppath=apppath,
                         dispatchparts=dispatchparts, dispatchpath=dispatchpath,
                         havepathinfo='PATH_INFO' in env,
                         reponame=env.get('REPO_NAME'),
                         querystring=querystring,
                         qsparams=qsparams,
                         headers=headers,
                         bodyfh=bodyfh)

291

292

class offsettrackingwriter(object):
    """Append-only file-like wrapper that counts how much has been written.

    An instance wraps a callable. Every ``write()`` forwards its data to
    that callable and updates a running total, which ``tell()`` reports.

    The intent of this class is to wrap the ``write()`` function returned by
    a WSGI ``start_response()`` function. Since ``write()`` is a callable and
    not a file object, it doesn't implement other file object methods.
    """

    def __init__(self, writefn):
        self._offset = 0
        self._write = writefn

    def write(self, s):
        """Forward ``s`` to the wrapped callable and advance the offset."""
        written = self._write(s)
        # Some Python objects don't report the number of bytes written; in
        # that case assume the whole chunk was consumed.
        self._offset += len(s) if written is None else written

    def flush(self):
        """Do nothing; present only for file object compatibility."""

    def tell(self):
        """Return the running total accumulated by ``write()``."""
        return self._offset

322

323

class wsgiresponse(object):

323

class wsgiresponse(object):

324

"""Represents a response to a WSGI request.

324

"""Represents a response to a WSGI request.

325

326

A response consists of a status line, headers, and a body.

326

A response consists of a status line, headers, and a body.

327

328

Consumers must populate the ``status`` and ``headers`` fields and

328

Consumers must populate the ``status`` and ``headers`` fields and

329

make a call to a ``setbody*()`` method before the response can be

329

make a call to a ``setbody*()`` method before the response can be

330

issued.

330

issued.

331

332

When it is time to start sending the response over the wire,

332

When it is time to start sending the response over the wire,

333

``sendresponse()`` is called. It handles emitting the header portion

333

``sendresponse()`` is called. It handles emitting the header portion

334

of the response message. It then yields chunks of body data to be

334

of the response message. It then yields chunks of body data to be

335

written to the peer. Typically, the WSGI application itself calls

335

written to the peer. Typically, the WSGI application itself calls

336

and returns the value from ``sendresponse()``.

336

and returns the value from ``sendresponse()``.

337

"""

337

"""

338

339

def __init__(self, req, startresponse):

339

def __init__(self, req, startresponse):

340

"""Create an empty response tied to a specific request.

340

"""Create an empty response tied to a specific request.

341

342

``req`` is a ``parsedrequest``. ``startresponse`` is the

342

``req`` is a ``parsedrequest``. ``startresponse`` is the

343

``start_response`` function passed to the WSGI application.

343

``start_response`` function passed to the WSGI application.

344

"""

344

"""

345

self._req = req

345

self._req = req

346

self._startresponse = startresponse

346

self._startresponse = startresponse

347

348

self.status = None

348

self.status = None

349

self.headers = wsgiheaders.Headers([])

349

self.headers = wsgiheaders.Headers([])

350

351

self._bodybytes = None

351

self._bodybytes = None

352

self._bodygen = None

352

self._bodygen = None

353

self._bodywillwrite = False

353

self._bodywillwrite = False

354

self._started = False

354

self._started = False

355

self._bodywritefn = None

355

self._bodywritefn = None

356

357

def _verifybody(self):

357

def _verifybody(self):

358

if (self._bodybytes is not None or self._bodygen is not None

358

if (self._bodybytes is not None or self._bodygen is not None

359

or self._bodywillwrite):

359

or self._bodywillwrite):

360

raise error.ProgrammingError('cannot define body multiple times')

360

raise error.ProgrammingError('cannot define body multiple times')

361

362

def setbodybytes(self, b):

362

def setbodybytes(self, b):

363

"""Define the response body as static bytes.

363

"""Define the response body as static bytes.

364

365

The empty string signals that there is no response body.

365

The empty string signals that there is no response body.

366

"""

366

"""

367

self._verifybody()

367

self._verifybody()

368

self._bodybytes = b

368

self._bodybytes = b

369

self.headers['Content-Length'] = '%d' % len(b)

369

self.headers['Content-Length'] = '%d' % len(b)

370

371

def setbodygen(self, gen):

371

def setbodygen(self, gen):

372

"""Define the response body as a generator of bytes."""

372

"""Define the response body as a generator of bytes."""

373

self._verifybody()

373

self._verifybody()

374

self._bodygen = gen

374

self._bodygen = gen

375

376

def setbodywillwrite(self):

376

def setbodywillwrite(self):

377

"""Signal an intent to use write() to emit the response body.

377

"""Signal an intent to use write() to emit the response body.

378

379

**This is the least preferred way to send a body.**

379

**This is the least preferred way to send a body.**

380

381

It is preferred for WSGI applications to emit a generator of chunks

381

It is preferred for WSGI applications to emit a generator of chunks

382

constituting the response body. However, some consumers can't emit

382

constituting the response body. However, some consumers can't emit

383

data this way. So, WSGI provides a way to obtain a ``write(data)``

383

data this way. So, WSGI provides a way to obtain a ``write(data)``

384

function that can be used to synchronously perform an unbuffered

384

function that can be used to synchronously perform an unbuffered

385

write.

385

write.

386

387

Calling this function signals an intent to produce the body in this

387

Calling this function signals an intent to produce the body in this

388

manner.

388

manner.

389

"""

389

"""

390

self._verifybody()

390

self._verifybody()

391

self._bodywillwrite = True

391

self._bodywillwrite = True

392

393

def sendresponse(self):

393

def sendresponse(self):

394

"""Send the generated response to the client.

394

"""Send the generated response to the client.

395

396

Before this is called, ``status`` must be set and one of

396

Before this is called, ``status`` must be set and one of

397

``setbodybytes()`` or ``setbodygen()`` must be called.

397

``setbodybytes()`` or ``setbodygen()`` must be called.

398

399

Calling this method multiple times is not allowed.

399

Calling this method multiple times is not allowed.

400

"""

400

"""

401

if self._started:

401

if self._started:

402

raise error.ProgrammingError('sendresponse() called multiple times')

402

raise error.ProgrammingError('sendresponse() called multiple times')

403

404

self._started = True

404

self._started = True

405

406

if not self.status:

406

if not self.status:

407

raise error.ProgrammingError('status line not defined')

407

raise error.ProgrammingError('status line not defined')

408

409

if (self._bodybytes is None and self._bodygen is None

409

if (self._bodybytes is None and self._bodygen is None

410

and not self._bodywillwrite):

410

and not self._bodywillwrite):

411

raise error.ProgrammingError('response body not defined')

411

raise error.ProgrammingError('response body not defined')

412

413

# RFC 7232 Section 4.1 states that a 304 MUST generate one of

413

# RFC 7232 Section 4.1 states that a 304 MUST generate one of

414

# {Cache-Control, Content-Location, Date, ETag, Expires, Vary}

414

# {Cache-Control, Content-Location, Date, ETag, Expires, Vary}

415

# and SHOULD NOT generate other headers unless they could be used

415

# and SHOULD NOT generate other headers unless they could be used

416

# to guide cache updates. Furthermore, RFC 7230 Section 3.3.2

416

# to guide cache updates. Furthermore, RFC 7230 Section 3.3.2

417

# states that no response body can be issued. Content-Length can

417

# states that no response body can be issued. Content-Length can

418

# be sent. But if it is present, it should be the size of the response

418

# be sent. But if it is present, it should be the size of the response

419

# that wasn't transferred.

419

# that wasn't transferred.

420

if self.status.startswith('304 '):

420

if self.status.startswith('304 '):

421

# setbodybytes('') will set C-L to 0. This doesn't conform with the

421

# setbodybytes('') will set C-L to 0. This doesn't conform with the

422

# spec. So remove it.

422

# spec. So remove it.

423

if self.headers.get('Content-Length') == '0':

423

if self.headers.get('Content-Length') == '0':

424

del self.headers['Content-Length']

424

del self.headers['Content-Length']

425

426

# Strictly speaking, this is too strict. But until it causes

426

# Strictly speaking, this is too strict. But until it causes

427

# problems, let's be strict.

427

# problems, let's be strict.

428

badheaders = {k for k in self.headers.keys()

428

badheaders = {k for k in self.headers.keys()

429

if k.lower() not in ('date', 'etag', 'expires',

429

if k.lower() not in ('date', 'etag', 'expires',

430

'cache-control',

430

'cache-control',

431

'content-location',

431

'content-location',

432

'vary')}

432

'vary')}

433

if badheaders:

433

if badheaders:

434

raise error.ProgrammingError(

434

raise error.ProgrammingError(

435

'illegal header on 304 response: %s' %

435

'illegal header on 304 response: %s' %

436

', '.join(sorted(badheaders)))

436

', '.join(sorted(badheaders)))

437

438

if self._bodygen is not None or self._bodywillwrite:

438

if self._bodygen is not None or self._bodywillwrite:

439

raise error.ProgrammingError("must use setbodybytes('') with "

439

raise error.ProgrammingError("must use setbodybytes('') with "

440

"304 responses")

440

"304 responses")

441

442

# Various HTTP clients (notably httplib) won't read the HTTP response

442

# Various HTTP clients (notably httplib) won't read the HTTP response

443

# until the HTTP request has been sent in full. If servers (us) send a

443

# until the HTTP request has been sent in full. If servers (us) send a

444

# response before the HTTP request has been fully sent, the connection

444

# response before the HTTP request has been fully sent, the connection

445

# may deadlock because neither end is reading.

445

# may deadlock because neither end is reading.

446

#

446

#

447

# We work around this by "draining" the request data before

447

# We work around this by "draining" the request data before

448

# sending any response in some conditions.

448

# sending any response in some conditions.

449

drain = False

449

drain = False

450

close = False

450

close = False

451

452

# If the client sent Expect: 100-continue, we assume it is smart enough

452

# If the client sent Expect: 100-continue, we assume it is smart enough

453

# to deal with the server sending a response before reading the request.

453

# to deal with the server sending a response before reading the request.

454

# (httplib doesn't do this.)

454

# (httplib doesn't do this.)

455

if self._req.headers.get('Expect', '').lower() == '100-continue':

455

if self._req.headers.get('Expect', '').lower() == '100-continue':

456

pass

456

pass

457

# Only tend to request methods that have bodies. Strictly speaking,

457

# Only tend to request methods that have bodies. Strictly speaking,

458

# we should sniff for a body. But this is fine for our existing

458

# we should sniff for a body. But this is fine for our existing

459

# WSGI applications.

459

# WSGI applications.

460

elif self._req.method not in ('POST', 'PUT'):

460

elif self._req.method not in ('POST', 'PUT'):

461

pass

461

pass

462

else:

462

else:

463

# If we don't know how much data to read, there's no guarantee

463

# If we don't know how much data to read, there's no guarantee

464

# that we can drain the request responsibly. The WSGI

464

# that we can drain the request responsibly. The WSGI

465

# specification only says that servers *should* ensure the

465

# specification only says that servers *should* ensure the

466

# input stream doesn't overrun the actual request. So there's

466

# input stream doesn't overrun the actual request. So there's

467

# no guarantee that reading until EOF won't corrupt the stream

467

# no guarantee that reading until EOF won't corrupt the stream

468

# state.

468

# state.

469

if not isinstance(self._req.bodyfh, util.cappedreader):

469

if not isinstance(self._req.bodyfh, util.cappedreader):

470

close = True

470

close = True

471

else:

471

else:

472

# We /could/ only drain certain HTTP response codes. But 200 and

472

# We /could/ only drain certain HTTP response codes. But 200 and

473

# non-200 wire protocol responses both require draining. Since

473

# non-200 wire protocol responses both require draining. Since

474

# we have a capped reader in place for all situations where we

474

# we have a capped reader in place for all situations where we

475

# drain, it is safe to read from that stream. We'll either do

475

# drain, it is safe to read from that stream. We'll either do

476

# a drain or no-op if we're already at EOF.

476

# a drain or no-op if we're already at EOF.

477

drain = True

477

drain = True

478

479

if close:

479

if close:

480

self.headers['Connection'] = 'Close'

480

self.headers['Connection'] = 'Close'

481

482

if drain:

482

if drain:

483

assert isinstance(self._req.bodyfh, util.cappedreader)

483

assert isinstance(self._req.bodyfh, util.cappedreader)

484

while True:

484

while True:

485

chunk = self._req.bodyfh.read(32768)

485

chunk = self._req.bodyfh.read(32768)

486

if not chunk:

486

if not chunk:

487

break

487

break

488

489

write = self._startresponse(pycompat.sysstr(self.status),

489

write = self._startresponse(pycompat.sysstr(self.status),

490

self.headers.items())

490

self.headers.items())

491

492

if self._bodybytes:

492

if self._bodybytes:

493

yield self._bodybytes

493

yield self._bodybytes

494

elif self._bodygen:

494

elif self._bodygen:

495

for chunk in self._bodygen:

495

for chunk in self._bodygen:

496

yield chunk

496

yield chunk

497

elif self._bodywillwrite:

497

elif self._bodywillwrite:

498

self._bodywritefn = write

498

self._bodywritefn = write

499

else:

499

else:

500

error.ProgrammingError('do not know how to send body')

500

error.ProgrammingError('do not know how to send body')

501

502

def getbodyfile(self):
    """Return a writable file-like object for emitting the response body.

    Preconditions: ``setbodywillwrite()`` has been called, and
    ``sendresponse()`` has been called *and consumed*. ``sendresponse()``
    is a generator, so none of its body runs until it is advanced. In
    this mode it yields no items; the simplest way to drive it is
    ``list(res.sendresponse())``, which evaluates to ``[]``.

    Raises ``error.ProgrammingError`` when either precondition is unmet.
    """
    problem = None
    if not self._bodywillwrite:
        problem = 'must call setbodywillwrite() first'
    elif not self._started:
        problem = ('must call sendresponse() first; did you remember to '
                   'consume it since it is a generator?')

    if problem is not None:
        raise error.ProgrammingError(problem)

    # sendresponse() stores the server's write callable here once the
    # response has been started in "will write" mode.
    writefn = self._bodywritefn
    assert writefn
    return offsettrackingwriter(writefn)

522

523

class wsgirequest(object):
    """Higher-level API for a WSGI request.

    WSGI applications are invoked with 2 arguments. They are used to
    instantiate instances of this class, which provides higher-level APIs
    for obtaining request parameters, writing HTTP output, etc.
    """
    def __init__(self, wsgienv, start_response):
        """Wrap a WSGI environ dict and its ``start_response`` callable.

        Raises ``RuntimeError`` unless ``wsgi.version`` is a 1.x version.
        """
        version = wsgienv[r'wsgi.version']
        if (version < (1, 0)) or (version >= (2, 0)):
            raise RuntimeError("Unknown and unsupported WSGI version %d.%d"
                               % version)

        inp = wsgienv[r'wsgi.input']

        # When the request declares its length, cap reads at that many
        # bytes so consumers cannot read past the end of this request.
        if r'HTTP_CONTENT_LENGTH' in wsgienv:
            inp = util.cappedreader(inp, int(wsgienv[r'HTTP_CONTENT_LENGTH']))
        elif r'CONTENT_LENGTH' in wsgienv:
            inp = util.cappedreader(inp, int(wsgienv[r'CONTENT_LENGTH']))

        self.err = wsgienv[r'wsgi.errors']
        self.threaded = wsgienv[r'wsgi.multithread']
        self.multiprocess = wsgienv[r'wsgi.multiprocess']
        self.run_once = wsgienv[r'wsgi.run_once']
        self.env = wsgienv
        self.req = parserequestfromenv(wsgienv, inp)
        self.res = wsgiresponse(self.req, start_response)
        # Set to None by respond() once the status line and headers are sent.
        self._start_response = start_response
        # Write callable returned by start_response; None when not available.
        self.server_write = None
        # Pending (name, value) response headers, flushed by respond().
        self.headers = []

    def respond(self, status, type, filename=None, body=None):
        """Send the status line and headers (once), then optionally a body.

        ``status`` may be an ``ErrorResponse``, an integer code, or a ready
        status string. ``type`` is the Content-Type value. ``filename``, if
        given, is reduced to its last ``/``-separated component, escaped and
        advertised via Content-Disposition. ``body``, if not None, sets
        Content-Length and is written after the headers.

        If the headers were already sent by an earlier call, only ``body``
        is written.

        Raises ``TypeError`` if a pending header value is not a ``str``.
        """
        if not isinstance(type, str):
            type = pycompat.sysstr(type)
        if self._start_response is not None:
            self.headers.append((r'Content-Type', type))
            if filename:
                filename = (filename.rpartition('/')[-1]
                            .replace('\\', '\\\\').replace('"', '\\"'))
                self.headers.append(('Content-Disposition',
                                     'inline; filename="%s"' % filename))
            if body is not None:
                self.headers.append((r'Content-Length', str(len(body))))

            for k, v in self.headers:
                if not isinstance(v, str):
                    raise TypeError('header value must be string: %r' % (v,))

            if isinstance(status, ErrorResponse):
                self.headers.extend(status.headers)
                status = statusmessage(status.code, pycompat.bytestr(status))
            elif status == 200:
                status = '200 Script output follows'
            elif isinstance(status, int):
                status = statusmessage(status)

            # Various HTTP clients (notably httplib) won't read the HTTP
            # response until the HTTP request has been sent in full. If servers
            # (us) send a response before the HTTP request has been fully sent,
            # the connection may deadlock because neither end is reading.
            #
            # We work around this by "draining" the request data before
            # sending any response in some conditions.
            drain = False
            close = False

            # If the client sent Expect: 100-continue, we assume it is smart
            # enough to deal with the server sending a response before reading
            # the request. (httplib doesn't do this.)
            if self.env.get(r'HTTP_EXPECT', r'').lower() == r'100-continue':
                pass
            # Only tend to request methods that have bodies. Strictly speaking,
            # we should sniff for a body. But this is fine for our existing
            # WSGI applications.
            elif self.env[r'REQUEST_METHOD'] not in (r'POST', r'PUT'):
                pass
            else:
                # If we don't know how much data to read, there's no guarantee
                # that we can drain the request responsibly. The WSGI
                # specification only says that servers *should* ensure the
                # input stream doesn't overrun the actual request. So there's
                # no guarantee that reading until EOF won't corrupt the stream
                # state.
                if not isinstance(self.req.bodyfh, util.cappedreader):
                    close = True
                else:
                    # We /could/ only drain certain HTTP response codes. But 200
                    # and non-200 wire protocol responses both require draining.
                    # Since we have a capped reader in place for all situations
                    # where we drain, it is safe to read from that stream. We'll
                    # either do a drain or no-op if we're already at EOF.
                    drain = True

            if close:
                self.headers.append((r'Connection', r'Close'))

            if drain:
                assert isinstance(self.req.bodyfh, util.cappedreader)
                while True:
                    chunk = self.req.bodyfh.read(32768)
                    if not chunk:
                        break

            self.server_write = self._start_response(
                pycompat.sysstr(status), self.headers)
            self._start_response = None
            self.headers = []
        if body is not None:
            self.write(body)
            self.server_write = None

    def write(self, thing):
        """Write ``thing`` to the client; empty/falsy values are skipped.

        A connection reset by the peer is silently ignored; every other
        ``socket.error`` propagates.
        """
        if thing:
            try:
                self.server_write(thing)
            except socket.error as inst:
                # Use the ``errno`` attribute rather than ``inst[0]``:
                # exceptions are not subscriptable on Python 3, where the
                # old form raised TypeError instead of ignoring the reset.
                if inst.errno != errno.ECONNRESET:
                    raise

    def flush(self):
        """No-op kept for file-object compatibility; always returns None."""
        return None

644

645

def wsgiapplication(app_maker):
    '''Wrap an application factory for old CGI scripts.

    ``app_maker`` is called once, immediately and without arguments. The
    returned callable forwards every ``(env, respond)`` call to the object
    the factory produced. New code can and should use a plain hgweb() or
    hgwebdir() as the WSGI application instead.'''
    wsgiapp = app_maker()

    def run_wsgi(env, respond):
        # Pure pass-through to the application built above.
        return wsgiapp(env, respond)

    return run_wsgi

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

@@ -0,0 +1,255 b''
	1	from __future__ import absolute_import, print_function
	2
	3	import unittest
	4
	5	from mercurial.hgweb import (
	6	request as requestmod,
	7	)
	8
# Baseline WSGI environ used by the tests below. ``parse()`` copies it and
# applies per-test overrides on top, so this dict itself is never modified.
DEFAULT_ENV = {
    r'REQUEST_METHOD': r'GET',
    r'SERVER_NAME': r'testserver',
    r'SERVER_PORT': r'80',
    r'SERVER_PROTOCOL': r'http',
    r'wsgi.version': (1, 0),
    r'wsgi.url_scheme': r'http',
    r'wsgi.input': None,
    r'wsgi.errors': None,
    r'wsgi.multithread': False,
    r'wsgi.multiprocess': True,
    r'wsgi.run_once': False,
}
	22
	23	def parse(env, bodyfh=None, extra=None):
	24	env = dict(env)
	25	env.update(extra or {})
	26
	27	return requestmod.parserequestfromenv(env, bodyfh)
	28
	29	class ParseRequestTests(unittest.TestCase):
	30	def testdefault(self):
	31	r = parse(DEFAULT_ENV)
	32	self.assertEqual(r.url, b'http://testserver')
	33	self.assertEqual(r.baseurl, b'http://testserver')
	34	self.assertEqual(r.advertisedurl, b'http://testserver')
	35	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	36	self.assertEqual(r.urlscheme, b'http')
	37	self.assertEqual(r.method, b'GET')
	38	self.assertIsNone(r.remoteuser)
	39	self.assertIsNone(r.remotehost)
	40	self.assertEqual(r.apppath, b'')
	41	self.assertEqual(r.dispatchparts, [])
	42	self.assertEqual(r.dispatchpath, b'')
	43	self.assertFalse(r.havepathinfo)
	44	self.assertIsNone(r.reponame)
	45	self.assertEqual(r.querystring, b'')
	46	self.assertEqual(len(r.qsparams), 0)
	47	self.assertEqual(len(r.headers), 0)
	48
	49	def testcustomport(self):
	50	r = parse(DEFAULT_ENV, extra={
	51	r'SERVER_PORT': r'8000',
	52	})
	53
	54	self.assertEqual(r.url, b'http://testserver:8000')
	55	self.assertEqual(r.baseurl, b'http://testserver:8000')
	56	self.assertEqual(r.advertisedurl, b'http://testserver:8000')
	57	self.assertEqual(r.advertisedbaseurl, b'http://testserver:8000')
	58
	59	r = parse(DEFAULT_ENV, extra={
	60	r'SERVER_PORT': r'4000',
	61	r'wsgi.url_scheme': r'https',
	62	})
	63
	64	self.assertEqual(r.url, b'https://testserver:4000')
	65	self.assertEqual(r.baseurl, b'https://testserver:4000')
	66	self.assertEqual(r.advertisedurl, b'https://testserver:4000')
	67	self.assertEqual(r.advertisedbaseurl, b'https://testserver:4000')
	68
	69	def testhttphost(self):
	70	r = parse(DEFAULT_ENV, extra={
	71	r'HTTP_HOST': r'altserver',
	72	})
	73
	74	self.assertEqual(r.url, b'http://altserver')
	75	self.assertEqual(r.baseurl, b'http://altserver')
	76	self.assertEqual(r.advertisedurl, b'http://testserver')
	77	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	78
	79	def testscriptname(self):
	80	r = parse(DEFAULT_ENV, extra={
	81	r'SCRIPT_NAME': r'',
	82	})
	83
	84	self.assertEqual(r.url, b'http://testserver')
	85	self.assertEqual(r.baseurl, b'http://testserver')
	86	self.assertEqual(r.advertisedurl, b'http://testserver')
	87	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	88	self.assertEqual(r.apppath, b'')
	89	self.assertEqual(r.dispatchparts, [])
	90	self.assertEqual(r.dispatchpath, b'')
	91	self.assertFalse(r.havepathinfo)
	92
	93	r = parse(DEFAULT_ENV, extra={
	94	r'SCRIPT_NAME': r'/script',
	95	})
	96
	97	self.assertEqual(r.url, b'http://testserver/script')
	98	self.assertEqual(r.baseurl, b'http://testserver')
	99	self.assertEqual(r.advertisedurl, b'http://testserver/script')
	100	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	101	self.assertEqual(r.apppath, b'/script')
	102	self.assertEqual(r.dispatchparts, [])
	103	self.assertEqual(r.dispatchpath, b'')
	104	self.assertFalse(r.havepathinfo)
	105
	106	r = parse(DEFAULT_ENV, extra={
	107	r'SCRIPT_NAME': r'/multiple words',
	108	})
	109
	110	self.assertEqual(r.url, b'http://testserver/multiple%20words')
	111	self.assertEqual(r.baseurl, b'http://testserver')
	112	self.assertEqual(r.advertisedurl, b'http://testserver/multiple%20words')
	113	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	114	self.assertEqual(r.apppath, b'/multiple words')
	115	self.assertEqual(r.dispatchparts, [])
	116	self.assertEqual(r.dispatchpath, b'')
	117	self.assertFalse(r.havepathinfo)
	118
	119	def testpathinfo(self):
	120	r = parse(DEFAULT_ENV, extra={
	121	r'PATH_INFO': r'',
	122	})
	123
	124	self.assertEqual(r.url, b'http://testserver')
	125	self.assertEqual(r.baseurl, b'http://testserver')
	126	self.assertEqual(r.advertisedurl, b'http://testserver')
	127	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	128	self.assertEqual(r.apppath, b'')
	129	self.assertEqual(r.dispatchparts, [])
	130	self.assertEqual(r.dispatchpath, b'')
	131	self.assertTrue(r.havepathinfo)
	132
	133	r = parse(DEFAULT_ENV, extra={
	134	r'PATH_INFO': r'/pathinfo',
	135	})
	136
	137	self.assertEqual(r.url, b'http://testserver/pathinfo')
	138	self.assertEqual(r.baseurl, b'http://testserver')
	139	self.assertEqual(r.advertisedurl, b'http://testserver/pathinfo')
	140	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	141	self.assertEqual(r.apppath, b'')
	142	self.assertEqual(r.dispatchparts, [b'pathinfo'])
	143	self.assertEqual(r.dispatchpath, b'pathinfo')
	144	self.assertTrue(r.havepathinfo)
	145
	146	r = parse(DEFAULT_ENV, extra={
	147	r'PATH_INFO': r'/one/two/',
	148	})
	149
	150	self.assertEqual(r.url, b'http://testserver/one/two/')
	151	self.assertEqual(r.baseurl, b'http://testserver')
	152	self.assertEqual(r.advertisedurl, b'http://testserver/one/two/')
	153	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	154	self.assertEqual(r.apppath, b'')
	155	self.assertEqual(r.dispatchparts, [b'one', b'two'])
	156	self.assertEqual(r.dispatchpath, b'one/two')
	157	self.assertTrue(r.havepathinfo)
	158
	159	def testscriptandpathinfo(self):
	160	r = parse(DEFAULT_ENV, extra={
	161	r'SCRIPT_NAME': r'/script',
	162	r'PATH_INFO': r'/pathinfo',
	163	})
	164
	165	self.assertEqual(r.url, b'http://testserver/script/pathinfo')
	166	self.assertEqual(r.baseurl, b'http://testserver')
	167	self.assertEqual(r.advertisedurl, b'http://testserver/script/pathinfo')
	168	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	169	self.assertEqual(r.apppath, b'/script')
	170	self.assertEqual(r.dispatchparts, [b'pathinfo'])
	171	self.assertEqual(r.dispatchpath, b'pathinfo')
	172	self.assertTrue(r.havepathinfo)
	173
	174	r = parse(DEFAULT_ENV, extra={
	175	r'SCRIPT_NAME': r'/script1/script2',
	176	r'PATH_INFO': r'/path1/path2',
	177	})
	178
	179	self.assertEqual(r.url,
	180	b'http://testserver/script1/script2/path1/path2')
	181	self.assertEqual(r.baseurl, b'http://testserver')
	182	self.assertEqual(r.advertisedurl,
	183	b'http://testserver/script1/script2/path1/path2')
	184	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	185	self.assertEqual(r.apppath, b'/script1/script2')
	186	self.assertEqual(r.dispatchparts, [b'path1', b'path2'])
	187	self.assertEqual(r.dispatchpath, b'path1/path2')
	188	self.assertTrue(r.havepathinfo)
	189
	190	r = parse(DEFAULT_ENV, extra={
	191	r'HTTP_HOST': r'hostserver',
	192	r'SCRIPT_NAME': r'/script',
	193	r'PATH_INFO': r'/pathinfo',
	194	})
	195
	196	self.assertEqual(r.url, b'http://hostserver/script/pathinfo')
	197	self.assertEqual(r.baseurl, b'http://hostserver')
	198	self.assertEqual(r.advertisedurl, b'http://testserver/script/pathinfo')
	199	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	200	self.assertEqual(r.apppath, b'/script')
	201	self.assertEqual(r.dispatchparts, [b'pathinfo'])
	202	self.assertEqual(r.dispatchpath, b'pathinfo')
	203	self.assertTrue(r.havepathinfo)
	204
	205	def testreponame(self):
	206	"""REPO_NAME path components get stripped from URL."""
	207	r = parse(DEFAULT_ENV, extra={
	208	r'REPO_NAME': r'repo',
	209	r'PATH_INFO': r'/path1/path2'
	210	})
	211
	212	self.assertEqual(r.url, b'http://testserver/path1/path2')
	213	self.assertEqual(r.baseurl, b'http://testserver')
	214	self.assertEqual(r.advertisedurl, b'http://testserver/path1/path2')
	215	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	216	self.assertEqual(r.apppath, b'/repo')
	217	self.assertEqual(r.dispatchparts, [b'path1', b'path2'])
	218	self.assertEqual(r.dispatchpath, b'path1/path2')
	219	self.assertTrue(r.havepathinfo)
	220	self.assertEqual(r.reponame, b'repo')
	221
	222	r = parse(DEFAULT_ENV, extra={
	223	r'REPO_NAME': r'repo',
	224	r'PATH_INFO': r'/repo/path1/path2',
	225	})
	226
	227	self.assertEqual(r.url, b'http://testserver/repo/path1/path2')
	228	self.assertEqual(r.baseurl, b'http://testserver')
	229	self.assertEqual(r.advertisedurl, b'http://testserver/repo/path1/path2')
	230	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	231	self.assertEqual(r.apppath, b'/repo')
	232	self.assertEqual(r.dispatchparts, [b'path1', b'path2'])
	233	self.assertEqual(r.dispatchpath, b'path1/path2')
	234	self.assertTrue(r.havepathinfo)
	235	self.assertEqual(r.reponame, b'repo')
	236
	237	r = parse(DEFAULT_ENV, extra={
	238	r'REPO_NAME': r'prefix/repo',
	239	r'PATH_INFO': r'/prefix/repo/path1/path2',
	240	})
	241
	242	self.assertEqual(r.url, b'http://testserver/prefix/repo/path1/path2')
	243	self.assertEqual(r.baseurl, b'http://testserver')
	244	self.assertEqual(r.advertisedurl,
	245	b'http://testserver/prefix/repo/path1/path2')
	246	self.assertEqual(r.advertisedbaseurl, b'http://testserver')
	247	self.assertEqual(r.apppath, b'/prefix/repo')
	248	self.assertEqual(r.dispatchparts, [b'path1', b'path2'])
	249	self.assertEqual(r.dispatchpath, b'path1/path2')
	250	self.assertTrue(r.havepathinfo)
	251	self.assertEqual(r.reponame, b'prefix/repo')
	252
if __name__ == '__main__':
    # Only reached when this file is executed directly; the import is kept
    # local so merely importing the module does not need the runner.
    import silenttestrunner
    silenttestrunner.main(__name__)

             # hgweb/request.py - An http request from either CGI or the standalone server.
             #
             # Copyright 21 May 2005 - (c) 2005 Jake Edge <jake@edge2.net>
             # Copyright 2005, 2006 Matt Mackall <mpm@selenic.com>
             #
             # This software may be used and distributed according to the terms of the
             # GNU General Public License version 2 or any later version.
             from __future__ import absolute_import
             import errno
             import socket
             import wsgiref.headers as wsgiheaders
             #import wsgiref.validate
             from .common import (
                 ErrorResponse,
                 statusmessage,
             )
             from ..thirdparty import (
                 attr,
             )
             from .. import (
                 error,
                 pycompat,
                 util,
             )
             class multidict(object):
                 """Mapping-like container that may hold several values per key.

                 Used for parsed request parameters. Modelled on the WebOb class
                 of the same name.
                 """
                 def __init__(self):
                     # A flat list of (key, value) pairs in insertion order. Every
                     # lookup is a linear scan; we lean on parameters so little
                     # that this should not matter. A dict index could be added
                     # later for fast lookups.
                     self._items = []

                 def __getitem__(self, key):
                     """Return the most recently stored value for ``key``."""
                     matches = [v for k, v in self._items if k == key]
                     if not matches:
                         raise KeyError(key)
                     return matches[-1]

                 def __setitem__(self, key, value):
                     """Discard all existing values for ``key``, then store one."""
                     self._items[:] = [(k, v) for k, v in self._items if k != key]
                     self._items.append((key, value))

                 def __delitem__(self, key):
                     """Remove every value for ``key``; KeyError if there is none."""
                     remaining = [(k, v) for k, v in self._items if k != key]
                     if len(remaining) == len(self._items):
                         raise KeyError(key)
                     # Slice-assign so the same list object is kept.
                     self._items[:] = remaining

                 def __contains__(self, key):
                     for k, _ in self._items:
                         if k == key:
                             return True
                     return False

                 def __len__(self):
                     # Counts stored pairs, not distinct keys.
                     return len(self._items)

                 def get(self, key, default=None):
                     """Like ``self[key]`` but returns ``default`` when absent."""
                     try:
                         return self[key]
                     except KeyError:
                         return default

                 def add(self, key, value):
                     """Append another value for ``key``, keeping existing ones."""
                     pair = (key, value)
                     self._items.append(pair)

                 def getall(self, key):
                     """Return a list of every value stored for ``key``, in order."""
                     found = []
                     for k, v in self._items:
                         if k == key:
                             found.append(v)
                     return found

                 def getone(self, key):
                     """Return the sole value stored for ``key``.

                     Raises KeyError if the key is missing or has several values.
                     """
                     found = self.getall(key)
                     if len(found) == 1:
                         return found[0]
                     if found:
                         raise KeyError('multiple values for %r' % key)
                     raise KeyError(key)

                 def asdictoflists(self):
                     """Return a plain dict mapping each key to its list of values."""
                     grouped = {}
                     for k, v in self._items:
                         grouped.setdefault(k, []).append(v)
                     return grouped
             @attr.s(frozen=True)
             class parsedrequest(object):
                 """Represents a parsed WSGI request.

                 Contains both parsed parameters as well as a handle on the input
                 stream. Declared frozen, so attributes are set once at
                 construction; ``parserequestfromenv()`` builds instances from a
                 WSGI environ.
                 """
                 # Request method.
                 method = attr.ib()
                 # Full URL for this request.
                 url = attr.ib()
                 # URL without any path components. Just <proto>://<host><port>.
                 baseurl = attr.ib()
                 # Advertised URL. Like ``url`` and ``baseurl`` but uses SERVER_NAME
                 # instead of the HTTP ``Host`` header for the hostname. This is
                 # likely what clients used.
                 advertisedurl = attr.ib()
                 advertisedbaseurl = attr.ib()
                 # URL scheme (part before ``://``). e.g. ``http`` or ``https``.
                 urlscheme = attr.ib()
                 # Value of REMOTE_USER, if set, or None.
                 remoteuser = attr.ib()
                 # Value of REMOTE_HOST, if set, or None.
                 remotehost = attr.ib()
                 # WSGI application path.
                 apppath = attr.ib()
                 # List of path parts to be used for dispatch.
                 dispatchparts = attr.ib()
                 # URL path component (no query string) used for dispatch.
                 dispatchpath = attr.ib()
                 # Whether there is a path component to this request. This can be true
                 # when ``dispatchpath`` is empty due to REPO_NAME muckery.
                 havepathinfo = attr.ib()
                 # The name of the repository being accessed.
                 reponame = attr.ib()
                 # Raw query string (part after "?" in URL).
                 querystring = attr.ib()
                 # multidict of query string parameters.
                 qsparams = attr.ib()
                 # wsgiref.headers.Headers instance. Operates like a dict with case
                 # insensitive keys.
                 headers = attr.ib()
                 # Request body input stream.
                 bodyfh = attr.ib()
             def parserequestfromenv(env, bodyfh):
                 """Parse URL components from environment variables.
                 WSGI defines request attributes via environment variables. This function
                 parses the environment variables into a data structure.
                 """
                 # PEP-0333 defines the WSGI spec and is a useful reference for this code.
                 # We first validate that the incoming object conforms with the WSGI spec.
                 # We only want to be dealing with spec-conforming WSGI implementations.
                 # TODO enable this once we fix internal violations.
                 #wsgiref.validate.check_environ(env)
                 # PEP-0333 states that environment keys and values are native strings
                 # (bytes on Python 2 and str on Python 3). The code points for the Unicode
                 # strings on Python 3 must be between \00000-\000FF. We deal with bytes
                 # in Mercurial, so mass convert string keys and values to bytes.
                 if pycompat.ispy3:
                     env = {k.encode('latin-1'): v for k, v in env.iteritems()}
                     env = {k: v.encode('latin-1') if isinstance(v, str) else v
                            for k, v in env.iteritems()}
                 # https://www.python.org/dev/peps/pep-0333/#environ-variables defines
                 # the environment variables.
                 # https://www.python.org/dev/peps/pep-0333/#url-reconstruction defines
                 # how URLs are reconstructed.
                 fullurl = env['wsgi.url_scheme'] + '://'
                 advertisedfullurl = fullurl
                 def addport(s):
                     if env['wsgi.url_scheme'] == 'https':
                         if env['SERVER_PORT'] != '443':
                             s += ':' + env['SERVER_PORT']
                     else:
                         if env['SERVER_PORT'] != '80':
                             s += ':' + env['SERVER_PORT']
                     return s
                 if env.get('HTTP_HOST'):
                     fullurl += env['HTTP_HOST']
                 else:
                     fullurl += env['SERVER_NAME']
                     fullurl = addport(fullurl)
                 advertisedfullurl += env['SERVER_NAME']
                 advertisedfullurl = addport(advertisedfullurl)
                 baseurl = fullurl
                 advertisedbaseurl = advertisedfullurl
                 fullurl += util.urlreq.quote(env.get('SCRIPT_NAME', ''))
                 advertisedfullurl += util.urlreq.quote(env.get('SCRIPT_NAME', ''))
                 fullurl += util.urlreq.quote(env.get('PATH_INFO', ''))
                 advertisedfullurl += util.urlreq.quote(env.get('PATH_INFO', ''))
                 if env.get('QUERY_STRING'):
                     fullurl += '?' + env['QUERY_STRING']
                     advertisedfullurl += '?' + env['QUERY_STRING']
                 # When dispatching requests, we look at the URL components (PATH_INFO
                 # and QUERY_STRING) after the application root (SCRIPT_NAME). But hgwebdir
                 # has the concept of "virtual" repositories. This is defined via REPO_NAME.
                 # If REPO_NAME is defined, we append it to SCRIPT_NAME to form a new app
                 # root. We also exclude its path components from PATH_INFO when resolving
                 # the dispatch path.
-                apppath = env['SCRIPT_NAME']
+                apppath = env.get('SCRIPT_NAME', '')
                 if env.get('REPO_NAME'):
                     if not apppath.endswith('/'):
                         apppath += '/'
                     apppath += env.get('REPO_NAME')
                 if 'PATH_INFO' in env:
                     dispatchparts = env['PATH_INFO'].strip('/').split('/')
                     # Strip out repo parts.
                     repoparts = env.get('REPO_NAME', '').split('/')
                     if dispatchparts[:len(repoparts)] == repoparts:
                         dispatchparts = dispatchparts[len(repoparts):]
                 else:
                     dispatchparts = []
                 dispatchpath = '/'.join(dispatchparts)
                 querystring = env.get('QUERY_STRING', '')
                 # We store as a list so we have ordering information. We also store as
                 # a dict to facilitate fast lookup.
                 qsparams = multidict()
                 for k, v in util.urlreq.parseqsl(querystring, keep_blank_values=True):
                     qsparams.add(k, v)
                 # HTTP_* keys contain HTTP request headers. The Headers structure should
                 # perform case normalization for us. We just rewrite underscore to dash
                 # so keys match what likely went over the wire.
                 headers = []
                 for k, v in env.iteritems():
                     if k.startswith('HTTP_'):
                         headers.append((k[len('HTTP_'):].replace('_', '-'), v))
                 headers = wsgiheaders.Headers(headers)
                 # This is kind of a lie because the HTTP header wasn't explicitly
                 # sent. But for all intents and purposes it should be OK to lie about
                 # this, since a consumer will use either value to determine how many
                 # bytes are available to read.
                 if 'CONTENT_LENGTH' in env and 'HTTP_CONTENT_LENGTH' not in env:
                     headers['Content-Length'] = env['CONTENT_LENGTH']
                 # TODO do this once we remove wsgirequest.inp, otherwise we could have
                 # multiple readers from the underlying input stream.
                 #bodyfh = env['wsgi.input']
                 #if 'Content-Length' in headers:
                 #    bodyfh = util.cappedreader(bodyfh, int(headers['Content-Length']))
                 return parsedrequest(method=env['REQUEST_METHOD'],
                                      url=fullurl, baseurl=baseurl,
                                      advertisedurl=advertisedfullurl,
                                      advertisedbaseurl=advertisedbaseurl,
                                      urlscheme=env['wsgi.url_scheme'],
                                      remoteuser=env.get('REMOTE_USER'),
                                      remotehost=env.get('REMOTE_HOST'),
                                      apppath=apppath,
                                      dispatchparts=dispatchparts, dispatchpath=dispatchpath,
                                      havepathinfo='PATH_INFO' in env,
                                      reponame=env.get('REPO_NAME'),
                                      querystring=querystring,
                                      qsparams=qsparams,
                                      headers=headers,
                                      bodyfh=bodyfh)
             class offsettrackingwriter(object):
                 """Append-only, file-like wrapper around a ``write(data)`` callable.

                 WSGI's ``start_response()`` hands back a bare ``write()`` callable
                 rather than a file object, so it has no ``tell()`` or ``flush()``.
                 This wrapper forwards every ``write()`` to that callable and keeps
                 a running total of the data written so ``tell()`` can be answered.
                 """

                 def __init__(self, writefn):
                     """Bind the wrapper to ``writefn``, the callable receiving data."""
                     self._offset = 0
                     self._write = writefn

                 def write(self, s):
                     """Forward ``s`` to the bound callable and advance the offset."""
                     written = self._write(s)
                     # Not every write callable reports how much it wrote; when it
                     # returns None, count the whole payload as written.
                     self._offset += len(s) if written is None else written

                 def flush(self):
                     """Do nothing; present only to satisfy the file object API."""

                 def tell(self):
                     """Return the total amount of data written so far."""
                     return self._offset
             class wsgiresponse(object):
                 """Represents a response to a WSGI request.

                 A response consists of a status line, headers, and a body.

                 Consumers must populate the ``status`` and ``headers`` fields and
                 make a call to a ``setbody*()`` method before the response can be
                 issued.

                 When it is time to start sending the response over the wire,
                 ``sendresponse()`` is called. It handles emitting the header portion
                 of the response message. It then yields chunks of body data to be
                 written to the peer. Typically, the WSGI application itself calls
                 and returns the value from ``sendresponse()``.
                 """

                 def __init__(self, req, startresponse):
                     """Create an empty response tied to a specific request.

                     ``req`` is a ``parsedrequest``. ``startresponse`` is the
                     ``start_response`` function passed to the WSGI application.
                     """
                     self._req = req
                     self._startresponse = startresponse

                     # Status line string (e.g. '304 Not Modified') and response
                     # headers; both are filled in by the consumer.
                     self.status = None
                     self.headers = wsgiheaders.Headers([])

                     # At most one of these is populated, by a setbody*() call.
                     self._bodybytes = None
                     self._bodygen = None
                     self._bodywillwrite = False

                     # Flipped once sendresponse() starts executing.
                     self._started = False
                     # The write() callable returned by start_response. Only
                     # retained when setbodywillwrite() was used.
                     self._bodywritefn = None

                 def _verifybody(self):
                     """Raise ``ProgrammingError`` if a body was already defined."""
                     if (self._bodybytes is not None or self._bodygen is not None
                         or self._bodywillwrite):
                         raise error.ProgrammingError('cannot define body multiple times')

                 def setbodybytes(self, b):
                     """Define the response body as static bytes.

                     The empty string signals that there is no response body.

                     Also sets the ``Content-Length`` header to ``len(b)``.
                     """
                     self._verifybody()
                     self._bodybytes = b
                     self.headers['Content-Length'] = '%d' % len(b)

                 def setbodygen(self, gen):
                     """Define the response body as a generator of bytes."""
                     self._verifybody()
                     self._bodygen = gen

                 def setbodywillwrite(self):
                     """Signal an intent to use write() to emit the response body.

                     **This is the least preferred way to send a body.**

                     It is preferred for WSGI applications to emit a generator of chunks
                     constituting the response body. However, some consumers can't emit
                     data this way. So, WSGI provides a way to obtain a ``write(data)``
                     function that can be used to synchronously perform an unbuffered
                     write.

                     Calling this function signals an intent to produce the body in this
                     manner.
                     """
                     self._verifybody()
                     self._bodywillwrite = True

                 def sendresponse(self):
                     """Send the generated response to the client.

                     Before this is called, ``status`` must be set and one of
                     ``setbodybytes()``, ``setbodygen()`` or ``setbodywillwrite()``
                     must be called.

                     This is a generator: nothing below runs (including the checks
                     that raise ``ProgrammingError``) until it is iterated. It yields
                     the chunks of the response body; with ``setbodywillwrite()`` or
                     an empty ``setbodybytes('')`` body it yields nothing.

                     Calling this method multiple times is not allowed.
                     """
                     if self._started:
                         raise error.ProgrammingError('sendresponse() called multiple times')

                     self._started = True

                     if not self.status:
                         raise error.ProgrammingError('status line not defined')

                     if (self._bodybytes is None and self._bodygen is None
                         and not self._bodywillwrite):
                         raise error.ProgrammingError('response body not defined')

                     # RFC 7232 Section 4.1 states that a 304 MUST generate one of
                     # {Cache-Control, Content-Location, Date, ETag, Expires, Vary}
                     # and SHOULD NOT generate other headers unless they could be used
                     # to guide cache updates. Furthermore, RFC 7230 Section 3.3.2
                     # states that no response body can be issued. Content-Length can
                     # be sent. But if it is present, it should be the size of the response
                     # that wasn't transferred.
                     if self.status.startswith('304 '):
                         # setbodybytes('') will set C-L to 0. This doesn't conform with the
                         # spec. So remove it.
                         if self.headers.get('Content-Length') == '0':
                             del self.headers['Content-Length']

                         # Strictly speaking, this is too strict. But until it causes
                         # problems, let's be strict.
                         badheaders = {k for k in self.headers.keys()
                                       if k.lower() not in ('date', 'etag', 'expires',
                                                            'cache-control',
                                                            'content-location',
                                                            'vary')}
                         if badheaders:
                             raise error.ProgrammingError(
                                 'illegal header on 304 response: %s' %
                                 ', '.join(sorted(badheaders)))

                         if self._bodygen is not None or self._bodywillwrite:
                             raise error.ProgrammingError("must use setbodybytes('') with "
                                                          "304 responses")

                     # Various HTTP clients (notably httplib) won't read the HTTP response
                     # until the HTTP request has been sent in full. If servers (us) send a
                     # response before the HTTP request has been fully sent, the connection
                     # may deadlock because neither end is reading.
                     #
                     # We work around this by "draining" the request data before
                     # sending any response in some conditions.
                     drain = False
                     close = False

                     # If the client sent Expect: 100-continue, we assume it is smart enough
                     # to deal with the server sending a response before reading the request.
                     # (httplib doesn't do this.)
                     if self._req.headers.get('Expect', '').lower() == '100-continue':
                         pass
                     # Only tend to request methods that have bodies. Strictly speaking,
                     # we should sniff for a body. But this is fine for our existing
                     # WSGI applications.
                     elif self._req.method not in ('POST', 'PUT'):
                         pass
                     else:
                         # If we don't know how much data to read, there's no guarantee
                         # that we can drain the request responsibly. The WSGI
                         # specification only says that servers *should* ensure the
                         # input stream doesn't overrun the actual request. So there's
                         # no guarantee that reading until EOF won't corrupt the stream
                         # state.
                         if not isinstance(self._req.bodyfh, util.cappedreader):
                             close = True
                         else:
                             # We /could/ only drain certain HTTP response codes. But 200 and
                             # non-200 wire protocol responses both require draining. Since
                             # we have a capped reader in place for all situations where we
                             # drain, it is safe to read from that stream. We'll either do
                             # a drain or no-op if we're already at EOF.
                             drain = True

                     if close:
                         self.headers['Connection'] = 'Close'

                     if drain:
                         assert isinstance(self._req.bodyfh, util.cappedreader)
                         # Read and discard whatever is left of the request body.
                         while True:
                             chunk = self._req.bodyfh.read(32768)
                             if not chunk:
                                 break

                     write = self._startresponse(pycompat.sysstr(self.status),
                                                 self.headers.items())

                     # Dispatch on which kind of body was *defined*, not on its
                     # truthiness: setbodybytes('') is the documented way to say
                     # "no body" and must not be mistaken for an undefined body.
                     if self._bodybytes is not None:
                         if self._bodybytes:
                             yield self._bodybytes
                     elif self._bodygen is not None:
                         for chunk in self._bodygen:
                             yield chunk
                     elif self._bodywillwrite:
                         self._bodywritefn = write
                     else:
                         # Unreachable given the "response body not defined" check
                         # above; kept as a guard against future body kinds.
                         raise error.ProgrammingError('do not know how to send body')

                 def getbodyfile(self):
                     """Obtain a file object like object representing the response body.

                     For this to work, you must call ``setbodywillwrite()`` and then
                     ``sendresponse()`` first. ``sendresponse()`` is a generator and the
                     function won't run to completion unless the generator is advanced. The
                     generator yields no items. The easiest way to consume it is with
                     ``list(res.sendresponse())``, which should resolve to an empty list -
                     ``[]``.

                     Returns an ``offsettrackingwriter`` wrapping the ``write()``
                     callable obtained from ``start_response``. Raises
                     ``ProgrammingError`` if the prerequisites above were not met.
                     """
                     if not self._bodywillwrite:
                         raise error.ProgrammingError('must call setbodywillwrite() first')

                     if not self._started:
                         raise error.ProgrammingError('must call sendresponse() first; did '
                                                      'you remember to consume it since it '
                                                      'is a generator?')

                     assert self._bodywritefn
                     return offsettrackingwriter(self._bodywritefn)
             class wsgirequest(object):
                 """Higher-level API for a WSGI request.

                 WSGI applications are invoked with 2 arguments. They are used to
                 instantiate instances of this class, which provides higher-level APIs
                 for obtaining request parameters, writing HTTP output, etc.
                 """

                 def __init__(self, wsgienv, start_response):
                     """Wrap a WSGI environment and its ``start_response`` callable.

                     ``wsgienv`` is the WSGI environ dict and ``start_response`` the
                     callable the WSGI server passed to the application.

                     Raises ``RuntimeError`` if ``wsgi.version`` is not a 1.x version.
                     """
                     version = wsgienv[r'wsgi.version']
                     if (version < (1, 0)) or (version >= (2, 0)):
                         raise RuntimeError("Unknown and unsupported WSGI version %d.%d"
                                            % version)

                     # When the request advertises a body length, wrap the input
                     # stream in a capped reader of that size. HTTP_CONTENT_LENGTH
                     # takes precedence over CONTENT_LENGTH.
                     inp = wsgienv[r'wsgi.input']

                     if r'HTTP_CONTENT_LENGTH' in wsgienv:
                         inp = util.cappedreader(inp, int(wsgienv[r'HTTP_CONTENT_LENGTH']))
                     elif r'CONTENT_LENGTH' in wsgienv:
                         inp = util.cappedreader(inp, int(wsgienv[r'CONTENT_LENGTH']))

                     self.err = wsgienv[r'wsgi.errors']
                     self.threaded = wsgienv[r'wsgi.multithread']
                     self.multiprocess = wsgienv[r'wsgi.multiprocess']
                     self.run_once = wsgienv[r'wsgi.run_once']
                     self.env = wsgienv
                     self.req = parserequestfromenv(wsgienv, inp)
                     self.res = wsgiresponse(self.req, start_response)
                     # Reset to None by respond() once the response has started.
                     self._start_response = start_response
                     # write() callable returned by start_response; set by respond().
                     self.server_write = None
                     # Pending (name, value) response headers for the next respond().
                     self.headers = []

                 def respond(self, status, type, filename=None, body=None):
                     """Start the HTTP response and optionally send a complete body.

                     ``status`` may be an ``ErrorResponse`` (its headers are added and
                     its code and message form the status line), an int (converted
                     with ``statusmessage()``; 200 becomes '200 Script output
                     follows'), or any other value, which is used as the status line
                     as-is.

                     ``type`` is the value for the ``Content-Type`` header.
                     ``filename``, if given, is advertised via an inline
                     ``Content-Disposition`` header. ``body``, if not None, is written
                     in full and ``Content-Length`` is set from it.

                     The response is only started on the first call; later calls skip
                     straight to writing ``body``.

                     Raises ``TypeError`` if a pending header value is not a ``str``.
                     """
                     if not isinstance(type, str):
                         type = pycompat.sysstr(type)
                     if self._start_response is not None:
                         self.headers.append((r'Content-Type', type))
                         if filename:
                             # Keep only the final path component and escape characters
                             # that are special inside a quoted header value.
                             filename = (filename.rpartition('/')[-1]
                                         .replace('\\', '\\\\').replace('"', '\\"'))
                             self.headers.append(('Content-Disposition',
                                                  'inline; filename="%s"' % filename))
                         if body is not None:
                             self.headers.append((r'Content-Length', str(len(body))))

                         # Note: this runs before any ErrorResponse headers are merged
                         # in below, so those are not covered by the check.
                         for k, v in self.headers:
                             if not isinstance(v, str):
                                 raise TypeError('header value must be string: %r' % (v,))

                         if isinstance(status, ErrorResponse):
                             self.headers.extend(status.headers)
                             status = statusmessage(status.code, pycompat.bytestr(status))
                         elif status == 200:
                             status = '200 Script output follows'
                         elif isinstance(status, int):
                             status = statusmessage(status)

                         # Various HTTP clients (notably httplib) won't read the HTTP
                         # response until the HTTP request has been sent in full. If servers
                         # (us) send a response before the HTTP request has been fully sent,
                         # the connection may deadlock because neither end is reading.
                         #
                         # We work around this by "draining" the request data before
                         # sending any response in some conditions.
                         drain = False
                         close = False

                         # If the client sent Expect: 100-continue, we assume it is smart
                         # enough to deal with the server sending a response before reading
                         # the request. (httplib doesn't do this.)
                         if self.env.get(r'HTTP_EXPECT', r'').lower() == r'100-continue':
                             pass
                         # Only tend to request methods that have bodies. Strictly speaking,
                         # we should sniff for a body. But this is fine for our existing
                         # WSGI applications.
                         elif self.env[r'REQUEST_METHOD'] not in (r'POST', r'PUT'):
                             pass
                         else:
                             # If we don't know how much data to read, there's no guarantee
                             # that we can drain the request responsibly. The WSGI
                             # specification only says that servers *should* ensure the
                             # input stream doesn't overrun the actual request. So there's
                             # no guarantee that reading until EOF won't corrupt the stream
                             # state.
                             if not isinstance(self.req.bodyfh, util.cappedreader):
                                 close = True
                             else:
                                 # We /could/ only drain certain HTTP response codes. But 200
                                 # and non-200 wire protocol responses both require draining.
                                 # Since we have a capped reader in place for all situations
                                 # where we drain, it is safe to read from that stream. We'll
                                 # either do a drain or no-op if we're already at EOF.
                                 drain = True

                         if close:
                             self.headers.append((r'Connection', r'Close'))

                         if drain:
                             assert isinstance(self.req.bodyfh, util.cappedreader)
                             # Read and discard whatever is left of the request body.
                             while True:
                                 chunk = self.req.bodyfh.read(32768)
                                 if not chunk:
                                     break

                         self.server_write = self._start_response(
                             pycompat.sysstr(status), self.headers)
                         self._start_response = None
                         self.headers = []
                     if body is not None:
                         self.write(body)
                         self.server_write = None

                 def write(self, thing):
                     """Write ``thing`` to the client via the server's write callable.

                     Falsy values are skipped entirely. A ``socket.error`` whose errno
                     is ``ECONNRESET`` (the peer went away) is silently ignored; any
                     other socket error propagates.
                     """
                     if thing:
                         try:
                             self.server_write(thing)
                         except socket.error as inst:
                             # Use the errno attribute rather than indexing the
                             # exception: exceptions are not subscriptable on
                             # Python 3, so ``inst[0]`` would raise TypeError there.
                             if inst.errno != errno.ECONNRESET:
                                 raise

                 def flush(self):
                     """Do nothing; present for file object API compatibility."""
                     return None
             def wsgiapplication(app_maker):
                 """Build a WSGI callable from an application factory.

                 Kept for compatibility with old CGI scripts; a plain hgweb() or
                 hgwebdir() can and should now be used as a WSGI application directly.

                 ``app_maker`` is called once, with no arguments, right away. The
                 returned function forwards ``(env, respond)`` to the application it
                 produced and returns that application's result.
                 """
                 wsgiapp = app_maker()

                 def run_wsgi(env, respond):
                     return wsgiapp(env, respond)

                 return run_wsgi