| """Base classes for server/gateway implementations""" | 
 |  | 
 | from .util import FileWrapper, guess_scheme, is_hop_by_hop | 
 | from .headers import Headers | 
 |  | 
 | import sys, os, time | 
 |  | 
 | __all__ = [ | 
 |     'BaseHandler', 'SimpleHandler', 'BaseCGIHandler', 'CGIHandler', | 
 |     'IISCGIHandler', 'read_environ' | 
 | ] | 
 |  | 
 | # Weekday and month names for HTTP date/time formatting; always English! | 
 | _weekdayname = ["Mon", "Tue", "Wed", "Thu", "Fri", "Sat", "Sun"] | 
 | _monthname = [None, # Dummy so we can use 1-based month numbers | 
 |               "Jan", "Feb", "Mar", "Apr", "May", "Jun", | 
 |               "Jul", "Aug", "Sep", "Oct", "Nov", "Dec"] | 
 |  | 
 | def format_date_time(timestamp): | 
 |     year, month, day, hh, mm, ss, wd, y, z = time.gmtime(timestamp) | 
 |     return "%s, %02d %3s %4d %02d:%02d:%02d GMT" % ( | 
 |         _weekdayname[wd], day, _monthname[month], year, hh, mm, ss | 
 |     ) | 
 |  | 
 | _is_request = { | 
 |     'SCRIPT_NAME', 'PATH_INFO', 'QUERY_STRING', 'REQUEST_METHOD', 'AUTH_TYPE', | 
 |     'CONTENT_TYPE', 'CONTENT_LENGTH', 'HTTPS', 'REMOTE_USER', 'REMOTE_IDENT', | 
 | }.__contains__ | 
 |  | 
 | def _needs_transcode(k): | 
 |     return _is_request(k) or k.startswith('HTTP_') or k.startswith('SSL_') \ | 
 |         or (k.startswith('REDIRECT_') and _needs_transcode(k[9:])) | 
 |  | 
 | def read_environ(): | 
 |     """Read environment, fixing HTTP variables""" | 
 |     enc = sys.getfilesystemencoding() | 
 |     esc = 'surrogateescape' | 
 |     try: | 
 |         ''.encode('utf-8', esc) | 
 |     except LookupError: | 
 |         esc = 'replace' | 
 |     environ = {} | 
 |  | 
 |     # Take the basic environment from native-unicode os.environ. Attempt to | 
 |     # fix up the variables that come from the HTTP request to compensate for | 
 |     # the bytes->unicode decoding step that will already have taken place. | 
 |     for k, v in os.environ.items(): | 
 |         if _needs_transcode(k): | 
 |  | 
 |             # On win32, the os.environ is natively Unicode. Different servers | 
 |             # decode the request bytes using different encodings. | 
 |             if sys.platform == 'win32': | 
 |                 software = os.environ.get('SERVER_SOFTWARE', '').lower() | 
 |  | 
 |                 # On IIS, the HTTP request will be decoded as UTF-8 as long | 
 |                 # as the input is a valid UTF-8 sequence. Otherwise it is | 
 |                 # decoded using the system code page (mbcs), with no way to | 
 |                 # detect this has happened. Because UTF-8 is the more likely | 
 |                 # encoding, and mbcs is inherently unreliable (an mbcs string | 
 |                 # that happens to be valid UTF-8 will not be decoded as mbcs) | 
 |                 # always recreate the original bytes as UTF-8. | 
 |                 if software.startswith('microsoft-iis/'): | 
 |                     v = v.encode('utf-8').decode('iso-8859-1') | 
 |  | 
 |                 # Apache mod_cgi writes bytes-as-unicode (as if ISO-8859-1) direct | 
 |                 # to the Unicode environ. No modification needed. | 
 |                 elif software.startswith('apache/'): | 
 |                     pass | 
 |  | 
 |                 # Python 3's http.server.CGIHTTPRequestHandler decodes | 
 |                 # using the urllib.unquote default of UTF-8, amongst other | 
 |                 # issues. | 
 |                 elif ( | 
 |                     software.startswith('simplehttp/') | 
 |                     and 'python/3' in software | 
 |                 ): | 
 |                     v = v.encode('utf-8').decode('iso-8859-1') | 
 |  | 
 |                 # For other servers, guess that they have written bytes to | 
 |                 # the environ using stdio byte-oriented interfaces, ending up | 
 |                 # with the system code page. | 
 |                 else: | 
 |                     v = v.encode(enc, 'replace').decode('iso-8859-1') | 
 |  | 
 |             # Recover bytes from unicode environ, using surrogate escapes | 
 |             # where available (Python 3.1+). | 
 |             else: | 
 |                 v = v.encode(enc, esc).decode('iso-8859-1') | 
 |  | 
 |         environ[k] = v | 
 |     return environ | 
 |  | 
 |  | 
 | class BaseHandler: | 
 |     """Manage the invocation of a WSGI application""" | 
 |  | 
 |     # Configuration parameters; can override per-subclass or per-instance | 
 |     wsgi_version = (1,0) | 
 |     wsgi_multithread = True | 
 |     wsgi_multiprocess = True | 
 |     wsgi_run_once = False | 
 |  | 
 |     origin_server = True    # We are transmitting direct to client | 
 |     http_version  = "1.0"   # Version that should be used for response | 
 |     server_software = None  # String name of server software, if any | 
 |  | 
 |     # os_environ is used to supply configuration from the OS environment: | 
 |     # by default it's a copy of 'os.environ' as of import time, but you can | 
 |     # override this in e.g. your __init__ method. | 
 |     os_environ= read_environ() | 
 |  | 
 |     # Collaborator classes | 
 |     wsgi_file_wrapper = FileWrapper     # set to None to disable | 
 |     headers_class = Headers             # must be a Headers-like class | 
 |  | 
 |     # Error handling (also per-subclass or per-instance) | 
 |     traceback_limit = None  # Print entire traceback to self.get_stderr() | 
 |     error_status = "500 Internal Server Error" | 
 |     error_headers = [('Content-Type','text/plain')] | 
 |     error_body = b"A server error occurred.  Please contact the administrator." | 
 |  | 
 |     # State variables (don't mess with these) | 
 |     status = result = None | 
 |     headers_sent = False | 
 |     headers = None | 
 |     bytes_sent = 0 | 
 |  | 
 |     def run(self, application): | 
 |         """Invoke the application""" | 
 |         # Note to self: don't move the close()!  Asynchronous servers shouldn't | 
 |         # call close() from finish_response(), so if you close() anywhere but | 
 |         # the double-error branch here, you'll break asynchronous servers by | 
 |         # prematurely closing.  Async servers must return from 'run()' without | 
 |         # closing if there might still be output to iterate over. | 
 |         try: | 
 |             self.setup_environ() | 
 |             self.result = application(self.environ, self.start_response) | 
 |             self.finish_response() | 
 |         except: | 
 |             try: | 
 |                 self.handle_error() | 
 |             except: | 
 |                 # If we get an error handling an error, just give up already! | 
 |                 self.close() | 
 |                 raise   # ...and let the actual server figure it out. | 
 |  | 
 |  | 
 |     def setup_environ(self): | 
 |         """Set up the environment for one request""" | 
 |  | 
 |         env = self.environ = self.os_environ.copy() | 
 |         self.add_cgi_vars() | 
 |  | 
 |         env['wsgi.input']        = self.get_stdin() | 
 |         env['wsgi.errors']       = self.get_stderr() | 
 |         env['wsgi.version']      = self.wsgi_version | 
 |         env['wsgi.run_once']     = self.wsgi_run_once | 
 |         env['wsgi.url_scheme']   = self.get_scheme() | 
 |         env['wsgi.multithread']  = self.wsgi_multithread | 
 |         env['wsgi.multiprocess'] = self.wsgi_multiprocess | 
 |  | 
 |         if self.wsgi_file_wrapper is not None: | 
 |             env['wsgi.file_wrapper'] = self.wsgi_file_wrapper | 
 |  | 
 |         if self.origin_server and self.server_software: | 
 |             env.setdefault('SERVER_SOFTWARE',self.server_software) | 
 |  | 
 |  | 
 |     def finish_response(self): | 
 |         """Send any iterable data, then close self and the iterable | 
 |  | 
 |         Subclasses intended for use in asynchronous servers will | 
 |         want to redefine this method, such that it sets up callbacks | 
 |         in the event loop to iterate over the data, and to call | 
 |         'self.close()' once the response is finished. | 
 |         """ | 
 |         try: | 
 |             if not self.result_is_file() or not self.sendfile(): | 
 |                 for data in self.result: | 
 |                     self.write(data) | 
 |                 self.finish_content() | 
 |         finally: | 
 |             self.close() | 
 |  | 
 |  | 
 |     def get_scheme(self): | 
 |         """Return the URL scheme being used""" | 
 |         return guess_scheme(self.environ) | 
 |  | 
 |  | 
 |     def set_content_length(self): | 
 |         """Compute Content-Length or switch to chunked encoding if possible""" | 
 |         try: | 
 |             blocks = len(self.result) | 
 |         except (TypeError,AttributeError,NotImplementedError): | 
 |             pass | 
 |         else: | 
 |             if blocks==1: | 
 |                 self.headers['Content-Length'] = str(self.bytes_sent) | 
 |                 return | 
 |         # XXX Try for chunked encoding if origin server and client is 1.1 | 
 |  | 
 |  | 
 |     def cleanup_headers(self): | 
 |         """Make any necessary header changes or defaults | 
 |  | 
 |         Subclasses can extend this to add other defaults. | 
 |         """ | 
 |         if 'Content-Length' not in self.headers: | 
 |             self.set_content_length() | 
 |  | 
 |     def start_response(self, status, headers,exc_info=None): | 
 |         """'start_response()' callable as specified by PEP 3333""" | 
 |  | 
 |         if exc_info: | 
 |             try: | 
 |                 if self.headers_sent: | 
 |                     # Re-raise original exception if headers sent | 
 |                     raise exc_info[0](exc_info[1]).with_traceback(exc_info[2]) | 
 |             finally: | 
 |                 exc_info = None        # avoid dangling circular ref | 
 |         elif self.headers is not None: | 
 |             raise AssertionError("Headers already set!") | 
 |  | 
 |         self.status = status | 
 |         self.headers = self.headers_class(headers) | 
 |         status = self._convert_string_type(status, "Status") | 
 |         assert len(status)>=4,"Status must be at least 4 characters" | 
 |         assert int(status[:3]),"Status message must begin w/3-digit code" | 
 |         assert status[3]==" ", "Status message must have a space after code" | 
 |  | 
 |         if __debug__: | 
 |             for name, val in headers: | 
 |                 name = self._convert_string_type(name, "Header name") | 
 |                 val = self._convert_string_type(val, "Header value") | 
 |                 assert not is_hop_by_hop(name),"Hop-by-hop headers not allowed" | 
 |  | 
 |         return self.write | 
 |  | 
 |     def _convert_string_type(self, value, title): | 
 |         """Convert/check value type.""" | 
 |         if type(value) is str: | 
 |             return value | 
 |         raise AssertionError( | 
 |             "{0} must be of type str (got {1})".format(title, repr(value)) | 
 |         ) | 
 |  | 
 |     def send_preamble(self): | 
 |         """Transmit version/status/date/server, via self._write()""" | 
 |         if self.origin_server: | 
 |             if self.client_is_modern(): | 
 |                 self._write(('HTTP/%s %s\r\n' % (self.http_version,self.status)).encode('iso-8859-1')) | 
 |                 if 'Date' not in self.headers: | 
 |                     self._write( | 
 |                         ('Date: %s\r\n' % format_date_time(time.time())).encode('iso-8859-1') | 
 |                     ) | 
 |                 if self.server_software and 'Server' not in self.headers: | 
 |                     self._write(('Server: %s\r\n' % self.server_software).encode('iso-8859-1')) | 
 |         else: | 
 |             self._write(('Status: %s\r\n' % self.status).encode('iso-8859-1')) | 
 |  | 
 |     def write(self, data): | 
 |         """'write()' callable as specified by PEP 3333""" | 
 |  | 
 |         assert type(data) is bytes, \ | 
 |             "write() argument must be a bytes instance" | 
 |  | 
 |         if not self.status: | 
 |             raise AssertionError("write() before start_response()") | 
 |  | 
 |         elif not self.headers_sent: | 
 |             # Before the first output, send the stored headers | 
 |             self.bytes_sent = len(data)    # make sure we know content-length | 
 |             self.send_headers() | 
 |         else: | 
 |             self.bytes_sent += len(data) | 
 |  | 
 |         # XXX check Content-Length and truncate if too many bytes written? | 
 |         self._write(data) | 
 |         self._flush() | 
 |  | 
 |  | 
 |     def sendfile(self): | 
 |         """Platform-specific file transmission | 
 |  | 
 |         Override this method in subclasses to support platform-specific | 
 |         file transmission.  It is only called if the application's | 
 |         return iterable ('self.result') is an instance of | 
 |         'self.wsgi_file_wrapper'. | 
 |  | 
 |         This method should return a true value if it was able to actually | 
 |         transmit the wrapped file-like object using a platform-specific | 
 |         approach.  It should return a false value if normal iteration | 
 |         should be used instead.  An exception can be raised to indicate | 
 |         that transmission was attempted, but failed. | 
 |  | 
 |         NOTE: this method should call 'self.send_headers()' if | 
 |         'self.headers_sent' is false and it is going to attempt direct | 
 |         transmission of the file. | 
 |         """ | 
 |         return False   # No platform-specific transmission by default | 
 |  | 
 |  | 
 |     def finish_content(self): | 
 |         """Ensure headers and content have both been sent""" | 
 |         if not self.headers_sent: | 
 |             # Only zero Content-Length if not set by the application (so | 
 |             # that HEAD requests can be satisfied properly, see #3839) | 
 |             self.headers.setdefault('Content-Length', "0") | 
 |             self.send_headers() | 
 |         else: | 
 |             pass # XXX check if content-length was too short? | 
 |  | 
 |     def close(self): | 
 |         """Close the iterable (if needed) and reset all instance vars | 
 |  | 
 |         Subclasses may want to also drop the client connection. | 
 |         """ | 
 |         try: | 
 |             if hasattr(self.result,'close'): | 
 |                 self.result.close() | 
 |         finally: | 
 |             self.result = self.headers = self.status = self.environ = None | 
 |             self.bytes_sent = 0; self.headers_sent = False | 
 |  | 
 |  | 
 |     def send_headers(self): | 
 |         """Transmit headers to the client, via self._write()""" | 
 |         self.cleanup_headers() | 
 |         self.headers_sent = True | 
 |         if not self.origin_server or self.client_is_modern(): | 
 |             self.send_preamble() | 
 |             self._write(bytes(self.headers)) | 
 |  | 
 |  | 
 |     def result_is_file(self): | 
 |         """True if 'self.result' is an instance of 'self.wsgi_file_wrapper'""" | 
 |         wrapper = self.wsgi_file_wrapper | 
 |         return wrapper is not None and isinstance(self.result,wrapper) | 
 |  | 
 |  | 
 |     def client_is_modern(self): | 
 |         """True if client can accept status and headers""" | 
 |         return self.environ['SERVER_PROTOCOL'].upper() != 'HTTP/0.9' | 
 |  | 
 |  | 
 |     def log_exception(self,exc_info): | 
 |         """Log the 'exc_info' tuple in the server log | 
 |  | 
 |         Subclasses may override to retarget the output or change its format. | 
 |         """ | 
 |         try: | 
 |             from traceback import print_exception | 
 |             stderr = self.get_stderr() | 
 |             print_exception( | 
 |                 exc_info[0], exc_info[1], exc_info[2], | 
 |                 self.traceback_limit, stderr | 
 |             ) | 
 |             stderr.flush() | 
 |         finally: | 
 |             exc_info = None | 
 |  | 
 |     def handle_error(self): | 
 |         """Log current error, and send error output to client if possible""" | 
 |         self.log_exception(sys.exc_info()) | 
 |         if not self.headers_sent: | 
 |             self.result = self.error_output(self.environ, self.start_response) | 
 |             self.finish_response() | 
 |         # XXX else: attempt advanced recovery techniques for HTML or text? | 
 |  | 
 |     def error_output(self, environ, start_response): | 
 |         """WSGI mini-app to create error output | 
 |  | 
 |         By default, this just uses the 'error_status', 'error_headers', | 
 |         and 'error_body' attributes to generate an output page.  It can | 
 |         be overridden in a subclass to dynamically generate diagnostics, | 
 |         choose an appropriate message for the user's preferred language, etc. | 
 |  | 
 |         Note, however, that it's not recommended from a security perspective to | 
 |         spit out diagnostics to any old user; ideally, you should have to do | 
 |         something special to enable diagnostic output, which is why we don't | 
 |         include any here! | 
 |         """ | 
 |         start_response(self.error_status,self.error_headers[:],sys.exc_info()) | 
 |         return [self.error_body] | 
 |  | 
 |  | 
 |     # Pure abstract methods; *must* be overridden in subclasses | 
 |  | 
 |     def _write(self,data): | 
 |         """Override in subclass to buffer data for send to client | 
 |  | 
 |         It's okay if this method actually transmits the data; BaseHandler | 
 |         just separates write and flush operations for greater efficiency | 
 |         when the underlying system actually has such a distinction. | 
 |         """ | 
 |         raise NotImplementedError | 
 |  | 
 |     def _flush(self): | 
 |         """Override in subclass to force sending of recent '_write()' calls | 
 |  | 
 |         It's okay if this method is a no-op (i.e., if '_write()' actually | 
 |         sends the data. | 
 |         """ | 
 |         raise NotImplementedError | 
 |  | 
 |     def get_stdin(self): | 
 |         """Override in subclass to return suitable 'wsgi.input'""" | 
 |         raise NotImplementedError | 
 |  | 
 |     def get_stderr(self): | 
 |         """Override in subclass to return suitable 'wsgi.errors'""" | 
 |         raise NotImplementedError | 
 |  | 
 |     def add_cgi_vars(self): | 
 |         """Override in subclass to insert CGI variables in 'self.environ'""" | 
 |         raise NotImplementedError | 
 |  | 
 |  | 
 | class SimpleHandler(BaseHandler): | 
 |     """Handler that's just initialized with streams, environment, etc. | 
 |  | 
 |     This handler subclass is intended for synchronous HTTP/1.0 origin servers, | 
 |     and handles sending the entire response output, given the correct inputs. | 
 |  | 
 |     Usage:: | 
 |  | 
 |         handler = SimpleHandler( | 
 |             inp,out,err,env, multithread=False, multiprocess=True | 
 |         ) | 
 |         handler.run(app)""" | 
 |  | 
 |     def __init__(self,stdin,stdout,stderr,environ, | 
 |         multithread=True, multiprocess=False | 
 |     ): | 
 |         self.stdin = stdin | 
 |         self.stdout = stdout | 
 |         self.stderr = stderr | 
 |         self.base_env = environ | 
 |         self.wsgi_multithread = multithread | 
 |         self.wsgi_multiprocess = multiprocess | 
 |  | 
 |     def get_stdin(self): | 
 |         return self.stdin | 
 |  | 
 |     def get_stderr(self): | 
 |         return self.stderr | 
 |  | 
 |     def add_cgi_vars(self): | 
 |         self.environ.update(self.base_env) | 
 |  | 
 |     def _write(self,data): | 
 |         self.stdout.write(data) | 
 |  | 
 |     def _flush(self): | 
 |         self.stdout.flush() | 
 |         self._flush = self.stdout.flush | 
 |  | 
 |  | 
 | class BaseCGIHandler(SimpleHandler): | 
 |  | 
 |     """CGI-like systems using input/output/error streams and environ mapping | 
 |  | 
 |     Usage:: | 
 |  | 
 |         handler = BaseCGIHandler(inp,out,err,env) | 
 |         handler.run(app) | 
 |  | 
 |     This handler class is useful for gateway protocols like ReadyExec and | 
 |     FastCGI, that have usable input/output/error streams and an environment | 
 |     mapping.  It's also the base class for CGIHandler, which just uses | 
 |     sys.stdin, os.environ, and so on. | 
 |  | 
 |     The constructor also takes keyword arguments 'multithread' and | 
 |     'multiprocess' (defaulting to 'True' and 'False' respectively) to control | 
 |     the configuration sent to the application.  It sets 'origin_server' to | 
 |     False (to enable CGI-like output), and assumes that 'wsgi.run_once' is | 
 |     False. | 
 |     """ | 
 |  | 
 |     origin_server = False | 
 |  | 
 |  | 
 | class CGIHandler(BaseCGIHandler): | 
 |  | 
 |     """CGI-based invocation via sys.stdin/stdout/stderr and os.environ | 
 |  | 
 |     Usage:: | 
 |  | 
 |         CGIHandler().run(app) | 
 |  | 
 |     The difference between this class and BaseCGIHandler is that it always | 
 |     uses 'wsgi.run_once' of 'True', 'wsgi.multithread' of 'False', and | 
 |     'wsgi.multiprocess' of 'True'.  It does not take any initialization | 
 |     parameters, but always uses 'sys.stdin', 'os.environ', and friends. | 
 |  | 
 |     If you need to override any of these parameters, use BaseCGIHandler | 
 |     instead. | 
 |     """ | 
 |  | 
 |     wsgi_run_once = True | 
 |     # Do not allow os.environ to leak between requests in Google App Engine | 
 |     # and other multi-run CGI use cases.  This is not easily testable. | 
 |     # See http://bugs.python.org/issue7250 | 
 |     os_environ = {} | 
 |  | 
 |     def __init__(self): | 
 |         BaseCGIHandler.__init__( | 
 |             self, sys.stdin.buffer, sys.stdout.buffer, sys.stderr, | 
 |             read_environ(), multithread=False, multiprocess=True | 
 |         ) | 
 |  | 
 |  | 
 | class IISCGIHandler(BaseCGIHandler): | 
 |     """CGI-based invocation with workaround for IIS path bug | 
 |  | 
 |     This handler should be used in preference to CGIHandler when deploying on | 
 |     Microsoft IIS without having set the config allowPathInfo option (IIS>=7) | 
 |     or metabase allowPathInfoForScriptMappings (IIS<7). | 
 |     """ | 
 |     wsgi_run_once = True | 
 |     os_environ = {} | 
 |  | 
 |     # By default, IIS gives a PATH_INFO that duplicates the SCRIPT_NAME at | 
 |     # the front, causing problems for WSGI applications that wish to implement | 
 |     # routing. This handler strips any such duplicated path. | 
 |  | 
 |     # IIS can be configured to pass the correct PATH_INFO, but this causes | 
 |     # another bug where PATH_TRANSLATED is wrong. Luckily this variable is | 
 |     # rarely used and is not guaranteed by WSGI. On IIS<7, though, the | 
 |     # setting can only be made on a vhost level, affecting all other script | 
 |     # mappings, many of which break when exposed to the PATH_TRANSLATED bug. | 
 |     # For this reason IIS<7 is almost never deployed with the fix. (Even IIS7 | 
 |     # rarely uses it because there is still no UI for it.) | 
 |  | 
 |     # There is no way for CGI code to tell whether the option was set, so a | 
 |     # separate handler class is provided. | 
 |     def __init__(self): | 
 |         environ= read_environ() | 
 |         path = environ.get('PATH_INFO', '') | 
 |         script = environ.get('SCRIPT_NAME', '') | 
 |         if (path+'/').startswith(script+'/'): | 
 |             environ['PATH_INFO'] = path[len(script):] | 
 |         BaseCGIHandler.__init__( | 
 |             self, sys.stdin.buffer, sys.stdout.buffer, sys.stderr, | 
 |             environ, multithread=False, multiprocess=True | 
 |         ) |