mercurial-scm/hg-stable: mercurial/hgweb/request.py comparison

comparison mercurial/hgweb/request.py @ 36863:da4e2f87167d

hgweb: expose input stream on parsed WSGI request object Our next step towards moving away from wsgirequest to our newer, friendlier parsedrequest type is input stream access. This commit exposes the input stream on the instance. Consumers in the HTTP protocol server switch to it. Because there were very few consumers of the input stream, we stopped storing a reference to the input stream on wsgirequest directly. All access now goes through parsedrequest. However, wsgirequest still may read from this stream as part of cgi.parse(). So we still need to create the stream from wsgirequest. Differential Revision: https://phab.mercurial-scm.org/D2771

author	Gregory Szorc <gregory.szorc@gmail.com>
date	Sat, 10 Mar 2018 11:06:13 -0800
parents	1f7d9024674c
children	01f6bba64424

comparison

equal deleted inserted replaced

-:1f7d9024674c
+:da4e2f87167d
 pycompat.bytesurl(i.strip()) for i in v]
 return bytesform
 @attr.s(frozen=True)
 class parsedrequest(object):
-"""Represents a parsed WSGI request / static HTTP request parameters."""
+"""Represents a parsed WSGI request.
+Contains both parsed parameters as well as a handle on the input stream.
+"""
 # Request method.
 method = attr.ib()
 # Full URL for this request.
 url = attr.ib()
 # Dict of query string arguments. Values are lists with at least 1 item.
 querystringdict = attr.ib()
 # wsgiref.headers.Headers instance. Operates like a dict with case
 # insensitive keys.
 headers = attr.ib()
+# Request body input stream.
-def parserequestfromenv(env):
+bodyfh = attr.ib()
+def parserequestfromenv(env, bodyfh):
 """Parse URL components from environment variables.
 WSGI defines request attributes via environment variables. This function
 parses the environment variables into a data structure.
 """
 # sent. But for all intents and purposes it should be OK to lie about
 # this, since a consumer will use either value to determine how many
 # bytes are available to read.
 if 'CONTENT_LENGTH' in env and 'HTTP_CONTENT_LENGTH' not in env:
 headers['Content-Length'] = env['CONTENT_LENGTH']
+# TODO do this once we remove wsgirequest.inp, otherwise we could have
+# multiple readers from the underlying input stream.
+#bodyfh = env['wsgi.input']
+#if 'Content-Length' in headers:
+#    bodyfh = util.cappedreader(bodyfh, int(headers['Content-Length']))
 return parsedrequest(method=env['REQUEST_METHOD'],
 url=fullurl, baseurl=baseurl,
 advertisedurl=advertisedfullurl,
 advertisedbaseurl=advertisedbaseurl,
 dispatchparts=dispatchparts, dispatchpath=dispatchpath,
 havepathinfo='PATH_INFO' in env,
 querystring=querystring,
 querystringlist=querystringlist,
 querystringdict=querystringdict,
-headers=headers)
+headers=headers,
+bodyfh=bodyfh)
 class wsgirequest(object):
 """Higher-level API for a WSGI request.
 WSGI applications are invoked with 2 arguments. They are used to
 def __init__(self, wsgienv, start_response):
 version = wsgienv[r'wsgi.version']
 if (version < (1, 0)) or (version >= (2, 0)):
 raise RuntimeError("Unknown and unsupported WSGI version %d.%d"
 % version)
-self.inp = wsgienv[r'wsgi.input']
+inp = wsgienv[r'wsgi.input']
 if r'HTTP_CONTENT_LENGTH' in wsgienv:
-self.inp = util.cappedreader(self.inp,
+inp = util.cappedreader(inp, int(wsgienv[r'HTTP_CONTENT_LENGTH']))
-int(wsgienv[r'HTTP_CONTENT_LENGTH']))
 elif r'CONTENT_LENGTH' in wsgienv:
-self.inp = util.cappedreader(self.inp,
+inp = util.cappedreader(inp, int(wsgienv[r'CONTENT_LENGTH']))
-int(wsgienv[r'CONTENT_LENGTH']))
 self.err = wsgienv[r'wsgi.errors']
 self.threaded = wsgienv[r'wsgi.multithread']
 self.multiprocess = wsgienv[r'wsgi.multiprocess']
 self.run_once = wsgienv[r'wsgi.run_once']
 self.env = wsgienv
-self.form = normalize(cgi.parse(self.inp,
+self.form = normalize(cgi.parse(inp,
 self.env,
 keep_blank_values=1))
 self._start_response = start_response
 self.server_write = None
 self.headers = []
-self.req = parserequestfromenv(wsgienv)
+self.req = parserequestfromenv(wsgienv, inp)
 def respond(self, status, type, filename=None, body=None):
 if not isinstance(type, str):
 type = pycompat.sysstr(type)
 if self._start_response is not None:
 # that we can drain the request responsibly. The WSGI
 # specification only says that servers *should* ensure the
 # input stream doesn't overrun the actual request. So there's
 # no guarantee that reading until EOF won't corrupt the stream
 # state.
-if not isinstance(self.inp, util.cappedreader):
+if not isinstance(self.req.bodyfh, util.cappedreader):
 close = True
 else:
 # We /could/ only drain certain HTTP response codes. But 200
 # and non-200 wire protocol responses both require draining.
 # Since we have a capped reader in place for all situations
 if close:
 self.headers.append((r'Connection', r'Close'))
 if drain:
-assert isinstance(self.inp, util.cappedreader)
+assert isinstance(self.req.bodyfh, util.cappedreader)
 while True:
-chunk = self.inp.read(32768)
+chunk = self.req.bodyfh.read(32768)
 if not chunk:
 break
 self.server_write = self._start_response(
 pycompat.sysstr(status), self.headers)

Mercurial > public > mercurial-scm > hg-stable

comparison mercurial/hgweb/request.py @ 36863:da4e2f87167d