Checkpoint commit.

author: Allan Saddi <allan@saddi.com> 2005-04-15 02:55:03 +0000
committer: Allan Saddi <allan@saddi.com> 2005-04-15 02:55:03 +0000
commit: 700071bc26f40727331651b4f273465a4faa0c7d (patch)
tree: 62cb10677bb5e732f29dd807e0dd37307564fc87 /flup/server/scgi.py
parent: e8f091226f39a888c019b1637fb8a47927b8a4ab (diff)
download: flup-700071bc26f40727331651b4f273465a4faa0c7d.tar.gz
1 files changed, 19 insertions, 546 deletions
diff --git a/flup/server/scgi.py b/flup/server/scgi.py
index c4bb20a..f8d0ed5 100644
--- a/flup/server/scgi.py
+++ b/flup/server/scgi.py
@@ -63,327 +63,15 @@ Example wrapper script:
 __author__ = 'Allan Saddi <allan@saddi.com>'
 __version__ = '$Revision$'
 
-import sys
 import logging
 import socket
-import select
-import errno
-import cStringIO as StringIO
-import signal
-import datetime
 
-# Threads are required. If you want a non-threaded (forking) version, look at
-# SWAP <http://www.idyll.org/~t/www-tools/wsgi/>.
-import thread
-import threading
+from scgi_base import BaseSCGIServer, Connection
+from threadedserver import ThreadedServer
 
 __all__ = ['WSGIServer']
 
-# The main classes use this name for logging.
-LoggerName = 'scgi-wsgi'
-
-# Set up module-level logger.
-console = logging.StreamHandler()
-console.setLevel(logging.DEBUG)
-console.setFormatter(logging.Formatter('%(asctime)s : %(message)s',
-                                       '%Y-%m-%d %H:%M:%S'))
-logging.getLogger(LoggerName).addHandler(console)
-del console
-
-class ProtocolError(Exception):
-    """
-    Exception raised when the server does something unexpected or
-    sends garbled data. Usually leads to a Connection closing.
-    """
-    pass
-
-def recvall(sock, length):
-    """
-    Attempts to receive length bytes from a socket, blocking if necessary.
-    (Socket may be blocking or non-blocking.)
-    """
-    dataList = []
-    recvLen = 0
-    while length:
-        try:
-            data = sock.recv(length)
-        except socket.error, e:
-            if e[0] == errno.EAGAIN:
-                select.select([sock], [], [])
-                continue
-            else:
-                raise
-        if not data: # EOF
-            break
-        dataList.append(data)
-        dataLen = len(data)
-        recvLen += dataLen
-        length -= dataLen
-    return ''.join(dataList), recvLen
-
-def readNetstring(sock):
-    """
-    Attempt to read a netstring from a socket.
-    """
-    # First attempt to read the length.
-    size = ''
-    while True:
-        try:
-            c = sock.recv(1)
-        except socket.error, e:
-            if e[0] == errno.EAGAIN:
-                select.select([sock], [], [])
-                continue
-            else:
-                raise
-        if c == ':':
-            break
-        if not c:
-            raise EOFError
-        size += c
-
-    # Try to decode the length.
-    try:
-        size = int(size)
-        if size < 0:
-            raise ValueError
-    except ValueError:
-        raise ProtocolError, 'invalid netstring length'
-
-    # Now read the string.
-    s, length = recvall(sock, size)
-
-    if length < size:
-        raise EOFError
-
-    # Lastly, the trailer.
-    trailer, length = recvall(sock, 1)
-
-    if length < 1:
-        raise EOFError
-
-    if trailer != ',':
-        raise ProtocolError, 'invalid netstring trailer'
-
-    return s
-
-class StdoutWrapper(object):
-    """
-    Wrapper for sys.stdout so we know if data has actually been written.
-    """
-    def __init__(self, stdout):
-        self._file = stdout
-        self.dataWritten = False
-
-    def write(self, data):
-        if data:
-            self.dataWritten = True
-        self._file.write(data)
-
-    def writelines(self, lines):
-        for line in lines:
-            self.write(line)
-
-    def __getattr__(self, name):
-        return getattr(self._file, name)
-
-class Request(object):
-    """
-    Encapsulates data related to a single request.
-
-    Public attributes:
-      environ - Environment variables from web server.
-      stdin - File-like object representing the request body.
-      stdout - File-like object for writing the response.
-    """
-    def __init__(self, conn, environ, input, output):
-        self._conn = conn
-        self.environ = environ
-        self.stdin = input
-        self.stdout = StdoutWrapper(output)
-
-        self.logger = logging.getLogger(LoggerName)
-
-    def run(self):
-        self.logger.info('%s %s%s',
-                         self.environ['REQUEST_METHOD'],
-                         self.environ.get('SCRIPT_NAME', ''),
-                         self.environ.get('PATH_INFO', ''))
-
-        start = datetime.datetime.now()
-
-        try:
-            self._conn.server.handler(self)
-        except:
-            self.logger.exception('Exception caught from handler')
-            if not self.stdout.dataWritten:
-                self._conn.server.error(self)
-
-        end = datetime.datetime.now()
-
-        handlerTime = end - start
-        self.logger.debug('%s %s%s done (%.3f secs)',
-                          self.environ['REQUEST_METHOD'],
-                          self.environ.get('SCRIPT_NAME', ''),
-                          self.environ.get('PATH_INFO', ''),
-                          handlerTime.seconds +
-                          handlerTime.microseconds / 1000000.0)
-
-class Connection(object):
-    """
-    Represents a single client (web server) connection. A single request
-    is handled, after which the socket is closed.
-    """
-    def __init__(self, sock, addr, server):
-        self._sock = sock
-        self._addr = addr
-        self.server = server
-
-        self.logger = logging.getLogger(LoggerName)
-
-    def run(self):
-        self.logger.debug('Connection starting up (%s:%d)',
-                          self._addr[0], self._addr[1])
-
-        try:
-            self.processInput()
-        except EOFError:
-            pass
-        except ProtocolError, e:
-            self.logger.error("Protocol error '%s'", str(e))
-        except:
-            self.logger.exception('Exception caught in Connection')
-
-        self.logger.debug('Connection shutting down (%s:%d)',
-                          self._addr[0], self._addr[1])
-
-        # All done!
-        self._sock.close()
-
-    def processInput(self):
-        # Read headers
-        headers = readNetstring(self._sock)
-        headers = headers.split('\x00')[:-1]
-        if len(headers) % 2 != 0:
-            raise ProtocolError, 'invalid headers'
-        environ = {}
-        for i in range(len(headers) / 2):
-            environ[headers[2*i]] = headers[2*i+1]
-
-        clen = environ.get('CONTENT_LENGTH')
-        if clen is None:
-            raise ProtocolError, 'missing CONTENT_LENGTH'
-        try:
-            clen = int(clen)
-            if clen < 0:
-                raise ValueError
-        except ValueError:
-            raise ProtocolError, 'invalid CONTENT_LENGTH'
-
-        self._sock.setblocking(1)
-        if clen:
-            input = self._sock.makefile('r')
-        else:
-            # Empty input.
-            input = StringIO.StringIO()
-
-        # stdout
-        output = self._sock.makefile('w')
-
-        # Allocate Request
-        req = Request(self, environ, input, output)
-
-        # Run it.
-        req.run()
-
-        output.close()
-        input.close()
-
-class ThreadPool(object):
-    """
-    Thread pool that maintains the number of idle threads between
-    minSpare and maxSpare inclusive. By default, there is no limit on
-    the number of threads that can be started, but this can be controlled
-    by maxThreads.
-    """
-    def __init__(self, minSpare=1, maxSpare=5, maxThreads=sys.maxint):
-        self._minSpare = minSpare
-        self._maxSpare = maxSpare
-        self._maxThreads = max(minSpare, maxThreads)
-
-        self._lock = threading.Condition()
-        self._workQueue = []
-        self._idleCount = self._workerCount = maxSpare
-
-        # Start the minimum number of worker threads.
-        for i in range(maxSpare):
-            thread.start_new_thread(self._worker, ())
-
-    def addJob(self, job, allowQueuing=True):
-        """
-        Adds a job to the work queue. The job object should have a run()
-        method. If allowQueuing is True (the default), the job will be
-        added to the work queue regardless if there are any idle threads
-        ready. (The only way for there to be no idle threads is if maxThreads
-        is some reasonable, finite limit.)
-
-        Otherwise, if allowQueuing is False, and there are no more idle
-        threads, the job will not be queued.
-
-        Returns True if the job was queued, False otherwise.
-        """
-        self._lock.acquire()
-        try:
-            # Maintain minimum number of spares.
-            while self._idleCount < self._minSpare and \
-                  self._workerCount < self._maxThreads:
-                self._workerCount += 1
-                self._idleCount += 1
-                thread.start_new_thread(self._worker, ())
-
-            # Hand off the job.
-            if self._idleCount or allowQueuing:
-                self._workQueue.append(job)
-                self._lock.notify()
-                return True
-            else:
-                return False
-        finally:
-            self._lock.release()
-
-    def _worker(self):
-        """
-        Worker thread routine. Waits for a job, executes it, repeat.
-        """
-        self._lock.acquire()
-        while True:
-            while not self._workQueue:
-                self._lock.wait()
-
-            # We have a job to do...
-            job = self._workQueue.pop(0)
-
-            assert self._idleCount > 0
-            self._idleCount -= 1
-
-            self._lock.release()
-
-            job.run()
-
-            self._lock.acquire()
-
-            if self._idleCount == self._maxSpare:
-                break # NB: lock still held
-            self._idleCount += 1
-            assert self._idleCount <= self._maxSpare
-
-        # Die off...
-        assert self._workerCount > self._maxSpare
-        self._workerCount -= 1
-
-        self._lock.release()
-
-class WSGIServer(object):
+class WSGIServer(BaseSCGIServer, ThreadedServer):
     """
     SCGI/WSGI server. For information about SCGI (Simple Common Gateway
     Interface), see <http://www.mems-exchange.org/software/scgi/>.
@@ -399,9 +87,6 @@ class WSGIServer(object):
     of preforking to be quite superior. So if your application really doesn't
     mind running in multiple processes, go use SWAP. ;)
     """
-    # What Request class to use.
-    requestClass = Request
-
     def __init__(self, application, environ=None,
                  multithreaded=True,
                  bindAddress=('localhost', 4000), allowedServers=None,
@@ -410,8 +95,6 @@ class WSGIServer(object):
         environ, which must be a dictionary, can contain any additional
         environment variables you want to pass to your application.
 
-        Set multithreaded to False if your application is not thread-safe.
-
         bindAddress is the address to bind to, which must be a tuple of
         length 2. The first element is a string, which is the host name
         or IPv4 address of a local interface. The 2nd element is the port
@@ -422,66 +105,24 @@ class WSGIServer(object):
         connections from anywhere.
 
         loggingLevel sets the logging level of the module-level logger.
-
-        Any additional keyword arguments are passed to the underlying
-        ThreadPool.
         """
-        if environ is None:
-            environ = {}
-
-        self.application = application
-        self.environ = environ
-        self.multithreaded = multithreaded
-        self._bindAddress = bindAddress
-        self._allowedServers = allowedServers
-
-        # Used to force single-threadedness.
-        self._appLock = thread.allocate_lock()
-
-        self._threadPool = ThreadPool(**kw)
-
-        self.logger = logging.getLogger(LoggerName)
-        self.logger.setLevel(loggingLevel)
-
-    def _setupSocket(self):
-        """Creates and binds the socket for communication with the server."""
-        sock = socket.socket()
-        sock.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
-        sock.bind(self._bindAddress)
-        sock.listen(socket.SOMAXCONN)
-        return sock
-
-    def _cleanupSocket(self, sock):
-        """Closes the main socket."""
-        sock.close()
-
-    def _isServerAllowed(self, addr):
-        return self._allowedServers is None or \
-               addr[0] in self._allowedServers
-
-    def _installSignalHandlers(self):
-        self._oldSIGs = [(x,signal.getsignal(x)) for x in
-                         (signal.SIGHUP, signal.SIGINT, signal.SIGTERM)]
-        signal.signal(signal.SIGHUP, self._hupHandler)
-        signal.signal(signal.SIGINT, self._intHandler)
-        signal.signal(signal.SIGTERM, self._intHandler)
-
-    def _restoreSignalHandlers(self):
-        for signum,handler in self._oldSIGs:
-            signal.signal(signum, handler)
-        
-    def _hupHandler(self, signum, frame):
-        self._hupReceived = True
-        self._keepGoing = False
-
-    def _intHandler(self, signum, frame):
-        self._keepGoing = False
+        BaseSCGIServer.__init__(self, application,
+                                environ=environ,
+                                multithreaded=multithreaded,
+                                bindAddress=bindAddress,
+                                allowedServers=allowedServers,
+                                loggingLevel=loggingLevel)
+        for key in ('jobClass', 'jobArgs'):
+            if kw.has_key(key):
+                del kw[key]
+        ThreadedServer.__init__(self, jobClass=Connection, jobArgs=(self,),
+                                **kw)
 
-    def run(self, timeout=1.0):
+    def run(self):
         """
         Main loop. Call this after instantiating WSGIServer. SIGHUP, SIGINT,
-        SIGTERM cause it to cleanup and return. (If a SIGHUP is caught, this
-        method returns True. Returns False otherwise.)
+        SIGQUIT, SIGTERM cause it to cleanup and return. (If a SIGHUP
+        is caught, this method returns True. Returns False otherwise.)
         """
         self.logger.info('%s starting up', self.__class__.__name__)
 
@@ -491,182 +132,14 @@ class WSGIServer(object):
             self.logger.error('Failed to bind socket (%s), exiting', e[1])
             return False
 
-        self._keepGoing = True
-        self._hupReceived = False
-
-        # Install signal handlers.
-        self._installSignalHandlers()
-
-        while self._keepGoing:
-            try:
-                r, w, e = select.select([sock], [], [], timeout)
-            except select.error, e:
-                if e[0] == errno.EINTR:
-                    continue
-                raise
-
-            if r:
-                try:
-                    clientSock, addr = sock.accept()
-                except socket.error, e:
-                    if e[0] in (errno.EINTR, errno.EAGAIN):
-                        continue
-                    raise
-
-                if not self._isServerAllowed(addr):
-                    self.logger.warning('Server connection from %s disallowed',
-                                        addr[0])
-                    clientSock.close()
-                    continue
-
-                # Hand off to Connection.
-                conn = Connection(clientSock, addr, self)
-                if not self._threadPool.addJob(conn, allowQueuing=False):
-                    # No thread left, immediately close the socket to hopefully
-                    # indicate to the web server that we're at our limit...
-                    # and to prevent having too many opened (and useless)
-                    # files.
-                    clientSock.close()
-
-            self._mainloopPeriodic()
-
-        # Restore old signal handlers.
-        self._restoreSignalHandlers()
+        ret = ThreadedServer.run(self, sock)
 
         self._cleanupSocket(sock)
 
         self.logger.info('%s shutting down%s', self.__class__.__name__,
                          self._hupReceived and ' (reload requested)' or '')
 
-        return self._hupReceived
-
-    def _mainloopPeriodic(self):
-        """
-        Called with just about each iteration of the main loop. Meant to
-        be overridden.
-        """
-        pass
-
-    def _exit(self, reload=False):
-        """
-        Protected convenience method for subclasses to force an exit. Not
-        really thread-safe, which is why it isn't public.
-        """
-        if self._keepGoing:
-            self._keepGoing = False
-            self._hupReceived = reload
-
-    def handler(self, request):
-        """
-        WSGI handler. Sets up WSGI environment, calls the application,
-        and sends the application's response.
-        """
-        environ = request.environ
-        environ.update(self.environ)
-
-        environ['wsgi.version'] = (1,0)
-        environ['wsgi.input'] = request.stdin
-        environ['wsgi.errors'] = sys.stderr
-        environ['wsgi.multithread'] = self.multithreaded
-        # AFAIK, the current mod_scgi does not do load-balancing/fail-over.
-        # So a single application deployment will only run in one process
-        # at a time, on this server.
-        environ['wsgi.multiprocess'] = False
-        environ['wsgi.run_once'] = False
-
-        if environ.get('HTTPS', 'off') in ('on', '1'):
-            environ['wsgi.url_scheme'] = 'https'
-        else:
-            environ['wsgi.url_scheme'] = 'http'
-
-        headers_set = []
-        headers_sent = []
-        result = None
-
-        def write(data):
-            assert type(data) is str, 'write() argument must be string'
-            assert headers_set, 'write() before start_response()'
-
-            if not headers_sent:
-                status, responseHeaders = headers_sent[:] = headers_set
-                found = False
-                for header,value in responseHeaders:
-                    if header.lower() == 'content-length':
-                        found = True
-                        break
-                if not found and result is not None:
-                    try:
-                        if len(result) == 1:
-                            responseHeaders.append(('Content-Length',
-                                                    str(len(data))))
-                    except:
-                        pass
-                s = 'Status: %s\r\n' % status
-                for header in responseHeaders:
-                    s += '%s: %s\r\n' % header
-                s += '\r\n'
-                try:
-                    request.stdout.write(s)
-                except socket.error, e:
-                    if e[0] != errno.EPIPE:
-                        raise
-
-            try:
-                request.stdout.write(data)
-                request.stdout.flush()
-            except socket.error, e:
-                if e[0] != errno.EPIPE:
-                    raise
-
-        def start_response(status, response_headers, exc_info=None):
-            if exc_info:
-                try:
-                    if headers_sent:
-                        # Re-raise if too late
-                        raise exc_info[0], exc_info[1], exc_info[2]
-                finally:
-                    exc_info = None # avoid dangling circular ref
-            else:
-                assert not headers_set, 'Headers already set!'
-
-            assert type(status) is str, 'Status must be a string'
-            assert len(status) >= 4, 'Status must be at least 4 characters'
-            assert int(status[:3]), 'Status must begin with 3-digit code'
-            assert status[3] == ' ', 'Status must have a space after code'
-            assert type(response_headers) is list, 'Headers must be a list'
-            if __debug__:
-                for name,val in response_headers:
-                    assert type(name) is str, 'Header names must be strings'
-                    assert type(val) is str, 'Header values must be strings'
-
-            headers_set[:] = [status, response_headers]
-            return write
-
-        if not self.multithreaded:
-            self._appLock.acquire()
-        try:
-            result = self.application(environ, start_response)
-            try:
-                for data in result:
-                    if data:
-                        write(data)
-                if not headers_sent:
-                    write('') # in case body was empty
-            finally:
-                if hasattr(result, 'close'):
-                    result.close()
-        finally:
-            if not self.multithreaded:
-                self._appLock.release()
-
-    def error(self, request):
-        """
-        Override to provide custom error handling. Ideally, however,
-        all errors should be caught at the application level.
-        """
-        import cgitb
-        request.stdout.write('Content-Type: text/html\r\n\r\n' +
-                             cgitb.html(sys.exc_info()))
+        return ret
 
 if __name__ == '__main__':
     def test_app(environ, start_response):
author	Allan Saddi <allan@saddi.com>	2005-04-15 02:55:03 +0000
committer	Allan Saddi <allan@saddi.com>	2005-04-15 02:55:03 +0000
commit	700071bc26f40727331651b4f273465a4faa0c7d (patch)
tree	62cb10677bb5e732f29dd807e0dd37307564fc87 /flup/server/scgi.py
parent	e8f091226f39a888c019b1637fb8a47927b8a4ab (diff)
download	flup-700071bc26f40727331651b4f273465a4faa0c7d.tar.gz